@ -190,14 +190,8 @@ public class SchemaConfiguration extends Configuration implements Serializable {
continueuniquecheck;
}
try{
SolrDocumentListdocs=segment.fulltext().getDefaultConnector().getDocumentListByQuery("-"+CollectionSchema.id.getSolrFieldName()+":\""+urlhash+"\" AND "+CollectionSchema.host_id_s.getSolrFieldName()+":\""+hostid+"\" AND "+signaturefield.getSolrFieldName()+":\""+signature.toString()+"\"",null,0,100,CollectionSchema.id.getSolrFieldName());
longdoccount=segment.fulltext().getDefaultConnector().getCountByQuery("-"+CollectionSchema.id.getSolrFieldName()+":\""+urlhash+"\" AND "+CollectionSchema.host_id_s.getSolrFieldName()+":\""+hostid+"\" AND "+signaturefield.getSolrFieldName()+":\""+signature.toString()+"\"");
// this tag may have values: all, index, noindex, follow, nofollow; see http://www.robotstxt.org/meta.html
if(robots_meta!=null){
robots_meta=robots_meta.toLowerCase();
if(robots_meta.indexOf("all",0)>=0)b+=1;// set bit 0
if(robots_meta.indexOf("index",0)==0||robots_meta.indexOf(" index",0)>=0||robots_meta.indexOf(",index",0)>=0)b+=2;// set bit 1
if(robots_meta.indexOf("follow",0)==0||robots_meta.indexOf(" follow",0)>=0||robots_meta.indexOf(",follow",0)>=0)b+=4;// set bit 2
@ -579,6 +578,7 @@ public class CollectionConfiguration extends SchemaConfiguration implements Seri
}
}
if(!x_robots_tag.isEmpty()){
x_robots_tag=x_robots_tag.toLowerCase();
// this tag may have values: all, noindex, nofollow, noarchive, nosnippet, noodp, notranslate, noimageindex, unavailable_after, none; see https://developers.google.com/webmasters/control-crawl-index/docs/robots_meta_tag?hl=de
if(x_robots_tag.indexOf("all",0)>=0)b+=1<<8;// set bit 8
if(x_robots_tag.indexOf("noindex",0)>=0||x_robots_tag.indexOf("none",0)>=0)b+=1<<9;// set bit 9
@ -754,14 +754,14 @@ public class CollectionConfiguration extends SchemaConfiguration implements Seri