It is now possible to get the results in two steps:
- first retrieve all IDs returned for a query
- then retrieve each document individually
This was necessary for very large result sets where a query may run for
hours and is possibly terminated by a solr-internal timeout. This occurs
regularly during postprocessing and therefore this commit may fix
unwanted postprocessing terminations.
((freshdate!=null&&freshdate.before(newDate()))?(" AND "+CollectionSchema.load_date_dt.getSolrFieldName()+":[* TO "+ISO8601Formatter.FORMATTER.format(freshdate)+"]"):"");
BlockingQueue<SolrDocument>docs=Fulltext.this.getDefaultConnector().concurrentDocumentsByQuery(this.query+" AND "+CollectionSchema.httpstatus_i.getSolrFieldName()+":200",null,0,100000000,Long.MAX_VALUE,100,1,
BlockingQueue<SolrDocument>docs=Fulltext.this.getDefaultConnector().concurrentDocumentsByQuery(this.query+" AND "+CollectionSchema.httpstatus_i.getSolrFieldName()+":200",null,0,100000000,Long.MAX_VALUE,100,1,true,
@ -1056,7 +1056,7 @@ public class CollectionConfiguration extends SchemaConfiguration implements Seri
// To do so, we first must collect all canonical links, find all references to them, get the anchor list of the documents and patch the citation reference of these links
Stringpatchquery=CollectionSchema.host_s.getSolrFieldName()+":"+host+" AND "+CollectionSchema.canonical_s.getSolrFieldName()+AbstractSolrConnector.CATCHALL_DTERM;
@ -1260,7 +1260,7 @@ public class CollectionConfiguration extends SchemaConfiguration implements Seri
CollectionSchema.host_subdomain_s.getSolrFieldName()+" asc,"+// sort on subdomain to get hosts without subdomain first; that gives an opportunity to set www_unique_b flag to false
CollectionSchema.url_protocol_s.getSolrFieldName()+" asc"// sort on protocol to get http before https; that gives an opportunity to set http_unique_b flag to false
q.append(CollectionSchema.host_s.getSolrFieldName()).append(':').append(hostname).append(" OR ").append(CollectionSchema.host_s.getSolrFieldName()).append(':').append("www.").append(hostname);