From 360a460da83bf23f9a1e6191616ff82c227bd92c Mon Sep 17 00:00:00 2001 From: hydrox Date: Sun, 12 Mar 2006 18:08:48 +0000 Subject: [PATCH] *)URL-Cleaner: moved logging-statement to correct position *)plasmaURLPattern: host is now added to the hashset in lowercase git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@1879 6c8d7289-2bf4-0310-a012-ef5d649a1542 --- source/de/anomic/plasma/plasmaCrawlLURL.java | 6 +++--- source/de/anomic/plasma/plasmaURLPattern.java | 2 +- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/source/de/anomic/plasma/plasmaCrawlLURL.java b/source/de/anomic/plasma/plasmaCrawlLURL.java index f41da491d..7a0121b5b 100644 --- a/source/de/anomic/plasma/plasmaCrawlLURL.java +++ b/source/de/anomic/plasma/plasmaCrawlLURL.java @@ -816,12 +816,12 @@ public final class plasmaCrawlLURL extends plasmaURL { lastBlacklistedHash = entry.hash(); serverLog.logFine("URLDBCLEANER", ++blacklistedUrls + " blacklisted (" + ((double)blacklistedUrls/totalSearchedUrls)*100 + "%): " + entry.hash() + " " + entry.url()); remove(entry.hash()); + if (blacklistedUrls % 100 == 0) { + serverLog.logInfo("URLDBCLEANER", "Deleted " + blacklistedUrls + " URLs until now. Last deleted URL-Hash: " + lastBlacklistedUrl); + } } lastUrl = entry.url().toString(); lastHash = entry.hash(); - if (blacklistedUrls % 100 == 0 && blacklistedUrls != 0) { - serverLog.logInfo("URLDBCLEANER", "Deleted " + blacklistedUrls + " URLs until now. Last deleted URL-Hash: " + lastBlacklistedUrl); - } } } catch (RuntimeException e) { if (e.getMessage().indexOf("not found in LURL") != -1) { diff --git a/source/de/anomic/plasma/plasmaURLPattern.java b/source/de/anomic/plasma/plasmaURLPattern.java index 6ae115a5f..540cf9bc1 100644 --- a/source/de/anomic/plasma/plasmaURLPattern.java +++ b/source/de/anomic/plasma/plasmaURLPattern.java @@ -81,7 +81,7 @@ public class plasmaURLPattern { public void add(String host, String path) { if (path.length() > 0 && path.charAt(0) == '/') path = path.substring(1); - hostpaths.put(host, path); + hostpaths.put(host.toLowerCase(), path); } public boolean isListed(String hostlow, String path) {