From a512aef6adf2fa582c2ed8de50be3de37dbcb753 Mon Sep 17 00:00:00 2001
From: orbiter
Date: Fri, 29 Jan 2010 10:33:20 +0000
Subject: [PATCH] fix for http://forum.yacy-websuche.de/viewtopic.php?p=18918#p18918

git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6629 6c8d7289-2bf4-0310-a012-ef5d649a1542
---
 source/de/anomic/search/MetadataRepository.java | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/source/de/anomic/search/MetadataRepository.java b/source/de/anomic/search/MetadataRepository.java
index 25c750bdf..90b8e5aba 100644
--- a/source/de/anomic/search/MetadataRepository.java
+++ b/source/de/anomic/search/MetadataRepository.java
@@ -364,7 +364,10 @@ public final class MetadataRepository implements Iterable {
 } else {
     final URIMetadataRow.Components metadata = entry.metadata();
     totalSearchedUrls++;
-    if (metadata.url() == null) {
+    if (metadata == null) {
+        if (Log.isFine("URLDBCLEANER")) Log.logFine("URLDBCLEANER", "corrupted entry for hash = " + entry.hash());
+        remove(entry.hash());
+    } else if (metadata.url() == null) {
         if (Log.isFine("URLDBCLEANER")) Log.logFine("URLDBCLEANER", ++blacklistedUrls + " blacklisted (" + ((double) blacklistedUrls / totalSearchedUrls) * 100 + "%): " + entry.hash() + "URL == null");
         remove(entry.hash());
     } else if (blacklist.isListed(Blacklist.BLACKLIST_CRAWLER, metadata.url()) ||