* URL-Cleaner: moved the progress logging statement to the correct position (out of the blacklisted-entry branch; it now also requires blacklistedUrls != 0)

* plasmaURLPattern: the host is now converted to lowercase before it is stored as a key in hostpaths

git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@1879 6c8d7289-2bf4-0310-a012-ef5d649a1542
pull/1/head
hydrox 19 years ago
parent 02f9765013
commit 360a460da8

@ -816,12 +816,12 @@ public final class plasmaCrawlLURL extends plasmaURL {
lastBlacklistedHash = entry.hash(); lastBlacklistedHash = entry.hash();
serverLog.logFine("URLDBCLEANER", ++blacklistedUrls + " blacklisted (" + ((double)blacklistedUrls/totalSearchedUrls)*100 + "%): " + entry.hash() + " " + entry.url()); serverLog.logFine("URLDBCLEANER", ++blacklistedUrls + " blacklisted (" + ((double)blacklistedUrls/totalSearchedUrls)*100 + "%): " + entry.hash() + " " + entry.url());
remove(entry.hash()); remove(entry.hash());
if (blacklistedUrls % 100 == 0) {
serverLog.logInfo("URLDBCLEANER", "Deleted " + blacklistedUrls + " URLs until now. Last deleted URL-Hash: " + lastBlacklistedUrl);
}
} }
lastUrl = entry.url().toString(); lastUrl = entry.url().toString();
lastHash = entry.hash(); lastHash = entry.hash();
if (blacklistedUrls % 100 == 0 && blacklistedUrls != 0) {
serverLog.logInfo("URLDBCLEANER", "Deleted " + blacklistedUrls + " URLs until now. Last deleted URL-Hash: " + lastBlacklistedUrl);
}
} }
} catch (RuntimeException e) { } catch (RuntimeException e) {
if (e.getMessage().indexOf("not found in LURL") != -1) { if (e.getMessage().indexOf("not found in LURL") != -1) {

@ -81,7 +81,7 @@ public class plasmaURLPattern {
public void add(String host, String path) { public void add(String host, String path) {
if (path.length() > 0 && path.charAt(0) == '/') path = path.substring(1); if (path.length() > 0 && path.charAt(0) == '/') path = path.substring(1);
hostpaths.put(host, path); hostpaths.put(host.toLowerCase(), path);
} }
public boolean isListed(String hostlow, String path) { public boolean isListed(String hostlow, String path) {

Loading…
Cancel
Save