Merge branch 'master' of ssh://git@gitorious.org/yacy/rc1.git

pull/1/head
Michael Peter Christen 11 years ago
commit d4f65833a1

@ -97,6 +97,7 @@ public class ContentScraper extends AbstractScraper implements Scraper {
embed(TagType.singleton), //added by [MN] embed(TagType.singleton), //added by [MN]
param(TagType.singleton), //added by [MN] param(TagType.singleton), //added by [MN]
iframe(TagType.singleton), // scraped as singleton to get such iframes that have no closing tag iframe(TagType.singleton), // scraped as singleton to get such iframes that have no closing tag
source(TagType.singleton), // html5 (part of <video> <audio>) - scaped like embed
a(TagType.pair), a(TagType.pair),
h1(TagType.pair), h1(TagType.pair),
@ -463,7 +464,7 @@ public class ContentScraper extends AbstractScraper implements Scraper {
this.anchors.add(newLink); this.anchors.add(newLink);
} }
} }
} else if(tag.name.equalsIgnoreCase("embed")) { } else if(tag.name.equalsIgnoreCase("embed") || tag.name.equalsIgnoreCase("source")) { //html5 tag
final String src = tag.opts.getProperty("src", EMPTY_STRING); final String src = tag.opts.getProperty("src", EMPTY_STRING);
try { try {
if (src.length() > 0) { if (src.length() > 0) {

Loading…
Cancel
Save