Avoid stopwords as topwords, configurable

git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@3454 6c8d7289-2bf4-0310-a012-ef5d649a1542
pull/1/head
rramthun 18 years ago
parent d755a8026d
commit 045d758537

@ -367,6 +367,13 @@ public class yacysearch {
kelondroMSetTools.excludeDestructive(topwords, plasmaSwitchboard.badwords); kelondroMSetTools.excludeDestructive(topwords, plasmaSwitchboard.badwords);
} }
//avoid stopwords being topwords
if (env.getConfig("filterOutStopwordsFromTopwords", "true").equals("true")) {
if ((plasmaSwitchboard.stopwords != null) && (plasmaSwitchboard.stopwords.size() > 0)) {
kelondroMSetTools.excludeDestructive(topwords, plasmaSwitchboard.stopwords);
}
}
String word; String word;
hintcount = 0; hintcount = 0;
final Iterator iter = topwords.iterator(); final Iterator iter = topwords.iterator();

@ -462,6 +462,11 @@ xsstopw=true
xdstopw=true xdstopw=true
xpstopw=true xpstopw=true
# Topwords filtering
# If set to true, all stopwords (from stopwords.yacy) are filtered out of the topwords.
# Change to false if you request hits from peers that have a modified stopwords file while using the unchanged client version.
filterOutStopwordsFromTopwords=true
# performance-settings # performance-settings
# delay-times for permanent loops (milliseconds) # delay-times for permanent loops (milliseconds)
# the idlesleep is the pause that a process sleeps if the last call to the # the idlesleep is the pause that a process sleeps if the last call to the

Loading…
Cancel
Save