to re-crawl documents with fresh_date_dt before today.==um Dokumente mit fresh_date_dt vor heute erneut zu crawlen.
after starting the recrawl job you can apply a custom Solr query to select documents to be processed==nach dem Start des Re-Crawl-Jobs kann die Solr-Abfrage bearbeitet werden, um gewünschte Dokumente zu verarbeiten
super(3000,1000);// set lower limits of cycle delay
super(3000,1000);// set lower limits of cycle delay
setName(THREAD_NAME);
setName(THREAD_NAME);
this.setIdleSleep(10*60000);// set actual cycle delays
this.setIdleSleep(10*60000);// set actual cycle delays
@ -68,6 +90,8 @@ public class RecrawlBusyThread extends AbstractBusyThread {
this.setPriority(Thread.MIN_PRIORITY);
this.setPriority(Thread.MIN_PRIORITY);
this.sb=xsb;
this.sb=xsb;
this.currentQuery=query;
this.includefailed=includeFailed;
urlstack=newHashSet<DigestURL>();
urlstack=newHashSet<DigestURL>();
// workaround to prevent solr exception on existing index (not fully reindexed) since intro of schema with docvalues
// workaround to prevent solr exception on existing index (not fully reindexed) since intro of schema with docvalues
// org.apache.solr.core.SolrCore java.lang.IllegalStateException: unexpected docvalues type NONE for field 'load_date_dt' (expected=NUMERIC). Use UninvertingReader or index with docvalues.
// org.apache.solr.core.SolrCore java.lang.IllegalStateException: unexpected docvalues type NONE for field 'load_date_dt' (expected=NUMERIC). Use UninvertingReader or index with docvalues.
@ -91,6 +115,19 @@ public class RecrawlBusyThread extends AbstractBusyThread {