From a025b1da89f87719a3d89fdcb796945bbd8ba248 Mon Sep 17 00:00:00 2001 From: f1ori Date: Mon, 15 Nov 2010 14:47:16 +0000 Subject: [PATCH] * fix bug when browsing local filesystem (e. g. repository) with yacy git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@7323 6c8d7289-2bf4-0310-a012-ef5d649a1542 --- source/net/yacy/document/parser/html/ContentScraper.java | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/source/net/yacy/document/parser/html/ContentScraper.java b/source/net/yacy/document/parser/html/ContentScraper.java index ce9cd9556..a3dfe8a16 100644 --- a/source/net/yacy/document/parser/html/ContentScraper.java +++ b/source/net/yacy/document/parser/html/ContentScraper.java @@ -547,7 +547,9 @@ public class ContentScraper extends AbstractScraper implements Scraper { // scrape document to look up charset final ScraperInputStream htmlFilter = new ScraperInputStream(new ByteArrayInputStream(page),"UTF-8", new MultiProtocolURI("http://localhost"),null,false); - final String charset = htmlParser.patchCharsetEncoding(htmlFilter.detectCharset()); + String charset = htmlParser.patchCharsetEncoding(htmlFilter.detectCharset()); + if(charset == null) + charset = Charset.defaultCharset().toString(); // scrape content final ContentScraper scraper = new ContentScraper(new MultiProtocolURI("http://localhost"));