add link extraction to pdfParser

This extracts clickable links in a PDF and adds them to the list of links. Includes a test case for this function. This is the corrected comment for commit aa2e15d846.
11 years ago · 59c6532a65
parent aa2e15d846
commit 59c6532a65
1 changed file with 1 addition and 1 deletion
--- a/source/net/yacy/document/parser/pdfParser.java
+++ b/source/net/yacy/document/parser/pdfParser.java
@@ -173,7 +173,7 @@ public class pdfParser extends AbstractParser implements Parser {
            contentBytes = writer.getBytes(); // get final text before closing writer
            pdflinks = extractPdfLinks(pdfDoc);
        } catch (final Throwable e) {
-            // close the writer (in finally)
+            //close the writer (in finally)
            //throw new Parser.Failure(e.getMessage(), location);
        } finally {
            try {pdfDoc.close();} catch (final Throwable e) {}