fix parser test cases

(Vocabulary parameter)
pull/1/head
reger 10 years ago
parent df83fcc4fc
commit 77851fa53c

@ -36,7 +36,7 @@ public class ParserTest {
final AnchorURL url = new AnchorURL("http://localhost/"+filename);
AbstractParser p = new ooxmlParser();
final Document[] docs = p.parse(url, mimetype, null, new FileInputStream(file));
final Document[] docs = p.parse(url, mimetype, null, null, new FileInputStream(file));
for (final Document doc: docs) {
final Reader content = new InputStreamReader(doc.getTextStream(), doc.getCharset());
final StringBuilder str = new StringBuilder();
@ -70,7 +70,7 @@ public class ParserTest {
final AnchorURL url = new AnchorURL("http://localhost/"+filename);
AbstractParser p = new odtParser();
final Document[] docs = p.parse(url, mimetype, null, new FileInputStream(file));
final Document[] docs = p.parse(url, mimetype, null, null, new FileInputStream(file));
for (final Document doc: docs) {
final Reader content = new InputStreamReader(doc.getTextStream(), doc.getCharset());
final StringBuilder str = new StringBuilder();
@ -102,7 +102,7 @@ public class ParserTest {
final AnchorURL url = new AnchorURL("http://localhost/"+filename);
AbstractParser p = new pdfParser();
final Document[] docs = p.parse(url, mimetype, null, new FileInputStream(file));
final Document[] docs = p.parse(url, mimetype, null, null, new FileInputStream(file));
for (final Document doc: docs) {
final Reader content = new InputStreamReader(doc.getTextStream(), doc.getCharset());
final StringBuilder str = new StringBuilder();
@ -134,7 +134,7 @@ public class ParserTest {
final AnchorURL url = new AnchorURL("http://localhost/"+filename);
AbstractParser p = new docParser();
final Document[] docs = p.parse(url, mimetype, null, new FileInputStream(file));
final Document[] docs = p.parse(url, mimetype, null, null, new FileInputStream(file));
for (final Document doc: docs) {
final Reader content = new InputStreamReader(doc.getTextStream(), doc.getCharset());
final StringBuilder str = new StringBuilder();
@ -172,7 +172,7 @@ public class ParserTest {
final AnchorURL url = new AnchorURL("http://localhost/" + filename);
AbstractParser p = new pptParser();
final Document[] docs = p.parse(url, mimetype, null, new FileInputStream(file));
final Document[] docs = p.parse(url, mimetype, null, null, new FileInputStream(file));
for (final Document doc : docs) {
final Reader content = new InputStreamReader(doc.getTextStream(), doc.getCharset());
final StringBuilder str = new StringBuilder();

@ -10,6 +10,7 @@ import junit.framework.TestCase;
import net.yacy.cora.document.id.AnchorURL;
import net.yacy.document.Document;
import net.yacy.document.Parser;
import net.yacy.document.VocabularyScraper;
import net.yacy.document.parser.html.ContentScraper;
import net.yacy.document.parser.html.ImageEntry;
import static net.yacy.document.parser.htmlParser.parseToScraper;
@ -74,7 +75,7 @@ public class htmlParserTest extends TestCase {
System.out.println("parse file: " + filename);
htmlParser p = new htmlParser();
final Document[] docs = p.parse(url, mimetype, null, new FileInputStream(file));
final Document[] docs = p.parse(url, mimetype, null, null, new FileInputStream(file));
Document doc = docs[0];
String txt = doc.getCharset();
@ -100,7 +101,7 @@ public class htmlParserTest extends TestCase {
+ "<figure><img width=\"550px\" title=\"image as exemple\" alt=\"image as exemple\" src=\"./img/my_image.png\"></figrue>" // + img width 550 (+html5 figure)
+ "</body></html>";
ContentScraper scraper = parseToScraper(url, mimetype, testhtml, 10);
ContentScraper scraper = parseToScraper(url, mimetype, new VocabularyScraper(), testhtml, 10);
List<AnchorURL> anchorlist = scraper.getAnchors();
String linktxt = anchorlist.get(0).getTextProperty();

@ -28,7 +28,7 @@ public class genericImageParserTest {
System.out.println("parse file: " + filename);
genericImageParser p = new genericImageParser();
final Document[] docs = p.parse(url, mimetype, charset, new FileInputStream(file));
final Document[] docs = p.parse(url, mimetype, charset, null, new FileInputStream(file));
Document doc = docs[0];
assertEquals("YaCy Logo",doc.dc_title());

@ -29,7 +29,7 @@ public class metadataImageParserTest {
System.out.println("parse file: " + filename);
metadataImageParser p = new metadataImageParser();
final Document[] docs = p.parse(url, mimetype, charset, new FileInputStream(file));
final Document[] docs = p.parse(url, mimetype, charset, null, new FileInputStream(file));
Document doc = docs[0];
assertEquals("YaCy Logo",doc.dc_title());

@ -29,7 +29,7 @@ public class pdfParserTest {
System.out.println("parse file: " + filename);
pdfParser p = new pdfParser();
final Document[] docs = p.parse(url, mimetype, charset, new FileInputStream(file));
final Document[] docs = p.parse(url, mimetype, charset, null, new FileInputStream(file));
Document doc = docs[0];
int ilinks = doc.getAnchors().size();

@ -5,6 +5,7 @@ import net.yacy.cora.document.encoding.ASCII;
import net.yacy.cora.document.id.DigestURL;
import net.yacy.cora.federate.yacy.CacheStrategy;
import net.yacy.cora.storage.HandleSet;
import net.yacy.cora.util.CommonPattern;
import net.yacy.kelondro.data.meta.URIMetadataNode;
import net.yacy.search.query.QueryGoal;
import net.yacy.search.schema.CollectionSchema;

Loading…
Cancel
Save