From 17ae51e741abb7d60593a2e7e378895324e67457 Mon Sep 17 00:00:00 2001 From: orbiter Date: Sun, 17 Mar 2013 22:13:56 +0100 Subject: [PATCH] increased the maximum number of links from 1000 to 10000 for RSS feeds and HTML documents --- defaults/solr.webgraph.schema | 2 +- source/net/yacy/cora/document/RSSFeed.java | 2 +- source/net/yacy/document/parser/htmlParser.java | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/defaults/solr.webgraph.schema b/defaults/solr.webgraph.schema index f7fb37f76..dec0dcb02 100644 --- a/defaults/solr.webgraph.schema +++ b/defaults/solr.webgraph.schema @@ -156,7 +156,7 @@ target_path_folders_sxt ## the values from key-value pairs in the search part of the url (target) #target_parameter_value_sxt -## "depth of web page according to number of clicks from the 'main' page, which is the page that appears if only the host is entered as url (target) +## depth of web page according to number of clicks from the 'main' page, which is the page that appears if only the host is entered as url (target) #target_clickdepth_i ## host of the url (target) diff --git a/source/net/yacy/cora/document/RSSFeed.java b/source/net/yacy/cora/document/RSSFeed.java index bb65405da..cb688e39a 100644 --- a/source/net/yacy/cora/document/RSSFeed.java +++ b/source/net/yacy/cora/document/RSSFeed.java @@ -31,7 +31,7 @@ import java.util.Set; public class RSSFeed implements Iterable { - public static final int DEFAULT_MAXSIZE = 1000; + public static final int DEFAULT_MAXSIZE = 10000; // class variables private RSSMessage channel; diff --git a/source/net/yacy/document/parser/htmlParser.java b/source/net/yacy/document/parser/htmlParser.java index fe0bd8184..a8d84a39b 100644 --- a/source/net/yacy/document/parser/htmlParser.java +++ b/source/net/yacy/document/parser/htmlParser.java @@ -51,7 +51,7 @@ import com.ibm.icu.text.CharsetDetector; public class htmlParser extends AbstractParser implements Parser { private static final Pattern patternUnderline = 
Pattern.compile("_"); - private static final int maxLinks = 1000; + private static final int maxLinks = 10000; public htmlParser() { super("Streaming HTML Parser");