Merge branch 'master' of https://github.com/yacy/yacy_search_server.git
commit
079112358c
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
@ -0,0 +1,57 @@
|
||||
package net.yacy.document.parser;
|
||||
|
||||
import java.io.File;
|
||||
import java.io.FileInputStream;
|
||||
import java.io.InputStreamReader;
|
||||
import java.io.Reader;
|
||||
import net.yacy.cora.document.id.AnchorURL;
|
||||
import net.yacy.document.AbstractParser;
|
||||
import net.yacy.document.Document;
|
||||
import net.yacy.document.VocabularyScraper;
|
||||
import static org.hamcrest.CoreMatchers.containsString;
|
||||
import org.junit.Test;
|
||||
import static org.junit.Assert.*;
|
||||
|
||||
public class xlsParserTest {
|
||||
|
||||
/**
|
||||
* Test of parse method, of class xlsParser.
|
||||
*/
|
||||
@Test
|
||||
public void testParse() throws Exception {
|
||||
final String[][] testFiles = new String[][]{
|
||||
// meaning: filename in test/parsertest, mimetype, title, creator, description,
|
||||
new String[]{"umlaute_linux.xls", "application/msexcel", "In München steht ein Hofbräuhaus, dort gibt es Bier in Maßkrügen", "", ""},
|
||||
new String[]{"umlaute_mac.xls", "application/msexcel", "In München steht ein Hofbräuhaus, dort gibt es Bier in Maßkrügen", "", ""},
|
||||
new String[]{"umlaute_windows.xls", "application/msexcel", "In München steht ein Hofbräuhaus, dort gibt es Bier in Maßkrügen", "afieg", ""}
|
||||
|
||||
};
|
||||
|
||||
for (final String[] testFile : testFiles) {
|
||||
|
||||
final String filename = "test/parsertest/" + testFile[0];
|
||||
final File file = new File(filename);
|
||||
final String mimetype = testFile[1];
|
||||
final AnchorURL url = new AnchorURL("http://localhost/" + filename);
|
||||
|
||||
AbstractParser p = new xlsParser();
|
||||
final Document[] docs = p.parse(url, mimetype, null, new VocabularyScraper(), 0, new FileInputStream(file));
|
||||
for (final Document doc : docs) {
|
||||
final Reader content = new InputStreamReader(doc.getTextStream(), doc.getCharset());
|
||||
final StringBuilder str = new StringBuilder();
|
||||
int c;
|
||||
while ((c = content.read()) != -1) {
|
||||
str.append((char) c);
|
||||
}
|
||||
|
||||
System.out.println("Parsed " + filename + ": " + str);
|
||||
assertThat(str.toString(), containsString("In München steht ein Hofbräuhaus, dort gibt es Bier in Maßkrügen"));
|
||||
assertThat(doc.dc_creator(), containsString(testFile[3]));
|
||||
if (testFile[4].length() > 0) {
|
||||
assertThat(doc.dc_description()[0], containsString(testFile[4]));
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
}
|
Loading…
Reference in new issue