From fc924f024e2430600e454dd20919a5ce3cebbfe3 Mon Sep 17 00:00:00 2001
From: orbiter
Date: Mon, 13 Sep 2010 10:13:34 +0000
Subject: [PATCH] import of oai sources from a list using a command line
 interface: if you have a list of oai servers you can import them all using
 the linux command: bin/importOAIList.sh

git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@7141 6c8d7289-2bf4-0310-a012-ef5d649a1542
---
Review notes (free text in this section is ignored by git am):
 * bin/importOAIList.sh was revised: the list is read before the cd so a
   relative list path works, every expansion is quoted, globbing is
   disabled while iterating over the URLs, the never-read counter C is
   removed, and a usage message is printed when no list is supplied on a
   terminal.
 * The blob "index" line of the new script was dropped because it
   described the previous script content.
 * The Java hunks are unchanged; the leading whitespace and blank context
   lines were reconstructed, so "git apply --ignore-whitespace" may be
   needed.

 bin/importOAIList.sh            | 27 +++++++++++++++++++++++++++
 htroot/IndexImportOAIPMH_p.java |  2 ++
 2 files changed, 29 insertions(+)
 create mode 100755 bin/importOAIList.sh

diff --git a/bin/importOAIList.sh b/bin/importOAIList.sh
new file mode 100755
--- /dev/null
+++ b/bin/importOAIList.sh
@@ -0,0 +1,27 @@
+#!/bin/sh
+# Import a list of OAI-PMH servers, one apicall.sh request per server.
+# usage: bin/importOAIList.sh <listfile>
+# <listfile> holds the OAI-PMH start URLs separated by whitespace/newlines;
+# without an argument the list is read from stdin.
+
+if [ $# -eq 0 ] && [ -t 0 ]; then
+  echo "usage: $0 <listfile>" >&2
+  exit 1
+fi
+
+# Read the list before changing directory so that a relative <listfile>
+# is resolved against the caller's working directory.
+LIST=$(cat "$@") || exit 1
+
+# apicall.sh is invoked relative to this script's directory.
+cd "$(dirname "$0")" || exit 1
+
+# Disable globbing: the URLs are split on whitespace only, and characters
+# such as '?' or '*' inside a URL must not be expanded against file names.
+set -f
+for N in $LIST; do
+  echo "import of $N:"
+  # NOTE(review): $N is appended unencoded; a URL containing '&' would
+  # presumably be cut off at that point by the query parser - confirm.
+  ./apicall.sh "/IndexImportOAIPMH_p.html?urlstart=$N" > /dev/null
+done
diff --git a/htroot/IndexImportOAIPMH_p.java b/htroot/IndexImportOAIPMH_p.java
index 8348506a6..1b6e4b566 100644
--- a/htroot/IndexImportOAIPMH_p.java
+++ b/htroot/IndexImportOAIPMH_p.java
@@ -36,6 +36,7 @@ import net.yacy.document.importer.ResumptionToken;
 import net.yacy.kelondro.data.meta.DigestURI;
 import net.yacy.kelondro.logging.Log;
 
+import de.anomic.data.WorkTables;
 import de.anomic.search.Switchboard;
 import de.anomic.server.serverObjects;
 import de.anomic.server.serverSwitch;
@@ -89,6 +90,7 @@ public class IndexImportOAIPMH_p {
 
             if (post.get("urlstart", "").length() > 0) {
                 String oaipmhurl = post.get("urlstart", "");
+                sb.tables.recordAPICall(post, "IndexImportOAIPMH_p.html", WorkTables.TABLE_API_TYPE_CRAWLER, "OAI-PMH import for " + oaipmhurl);
                 DigestURI url = null;
                 try {
                     url = new DigestURI(oaipmhurl, null);