finalStringlicense=URLLicense.aquireLicense(image.imageUrl);// this is just the license key to get the image forwarded through the YaCy thumbnail viewer, not an actual lawful license
finalStringlicense=URLLicense.aquireLicense(image.imageUrl);// this is just the license key to get the image forwarded through the YaCy thumbnail viewer, not an actual lawful license
@ -53,10 +54,11 @@ public class RecrawlBusyThread extends AbstractBusyThread {
privateStringcurrentQuery=CollectionSchema.fresh_date_dt.getSolrFieldName()+":[* TO NOW/DAY-1DAY]";// current query
privateStringcurrentQuery=CollectionSchema.fresh_date_dt.getSolrFieldName()+":[* TO NOW/DAY-1DAY]";// current query
privatebooleanincludefailed=false;// flag if docs with httpstatus_i <> 200 shall be recrawled
privatebooleanincludefailed=false;// flag if docs with httpstatus_i <> 200 shall be recrawled
privateintchunkstart=0;
privateintchunkstart=0;
privateintchunksize=200;
privatefinalintchunksize;
finalSwitchboardsb;
finalSwitchboardsb;
privatefinalSet<DigestURL>urlstack;// buffer of urls to recrawl
privatefinalSet<DigestURL>urlstack;// buffer of urls to recrawl
publiclongurlsfound=0;
publiclongurlsfound=0;
privateStringsolrSortBy;
publicRecrawlBusyThread(Switchboardxsb){
publicRecrawlBusyThread(Switchboardxsb){
super(3000,1000);// set lower limits of cycle delay
super(3000,1000);// set lower limits of cycle delay
@ -66,6 +68,10 @@ public class RecrawlBusyThread extends AbstractBusyThread {
this.sb=xsb;
this.sb=xsb;
urlstack=newHashSet<DigestURL>();
urlstack=newHashSet<DigestURL>();
// workaround to prevent solr exception on existing index (not fully reindexed) since intro of schema with docvalues
// org.apache.solr.core.SolrCore java.lang.IllegalStateException: unexpected docvalues type NONE for field 'load_date_dt' (expected=NUMERIC). Use UninvertingReader or index with docvalues.
SUPPORTED_MIME_TYPES.add("image/jpg");// this is in fact a 'wrong' mime type. We leave it here because that is a common error that occurs in the internet frequently
SUPPORTED_MIME_TYPES.add("image/jpg");// this is in fact a 'wrong' mime type. We leave it here because that is a common error that occurs in the internet frequently