this.sb.crawlQueues.errorURL.push(request.url(), profile,FailCategory.TEMPORARY_NETWORK_FAILURE,"no redirection url provided, field '"+HeaderFramework.LOCATION+"' is empty",statusCode);
this.sb.crawlQueues.errorURL.push(request.url(),request.depth(),profile,FailCategory.TEMPORARY_NETWORK_FAILURE,"no redirection url provided, field '"+HeaderFramework.LOCATION+"' is empty",statusCode);
thrownewIOException("REJECTED EMTPY REDIRECTION '"+client.getHttpResponse().getStatusLine()+"' for URL '"+requestURLString+"'$");
}
@ -154,13 +154,13 @@ public final class HTTPLoader {
this.sb.crawlQueues.errorURL.push(request.url(), profile,FailCategory.FINAL_REDIRECT_RULE,"redirect to "+redirectionUrlString,statusCode);
this.sb.crawlQueues.errorURL.push(request.url(),request.depth(),profile,FailCategory.FINAL_REDIRECT_RULE,"redirect to "+redirectionUrlString,statusCode);
thrownewIOException("REJECTED URL "+request.url()+" because file size '"+contentLength+"' exceeds max filesize limit of "+maxFileSize+" bytes. (GET)$");
}
@ -201,7 +201,7 @@ public final class HTTPLoader {
returnresponse;
}else{
// if the response has not the right response type then reject file
this.sb.crawlQueues.errorURL.push(request.url(), profile,FailCategory.TEMPORARY_NETWORK_FAILURE,"wrong http status code",statusCode);
this.sb.crawlQueues.errorURL.push(request.url(),request.depth(),profile,FailCategory.TEMPORARY_NETWORK_FAILURE,"wrong http status code",statusCode);
thrownewIOException("REJECTED WRONG STATUS TYPE '"+client.getHttpResponse().getStatusLine()+"' for URL '"+requestURLString+"'$");
if(this.log.isInfo())this.log.info("Not Condensed Resource '"+urls+"': denied by document-attached noindexing rule");
// create a new errorURL DB entry
this.crawlQueues.errorURL.push(in.queueEntry.url(), profile,FailCategory.FINAL_PROCESS_CONTEXT,"denied by document-attached noindexing rule",-1);
this.crawlQueues.errorURL.push(in.queueEntry.url(),in.queueEntry.depth(),profile,FailCategory.FINAL_PROCESS_CONTEXT,"denied by document-attached noindexing rule",-1);
//if (this.log.isInfo()) log.logInfo("Not Indexed Resource '" + queueEntry.url().toNormalform(false, true) + "': denied by rule in document, process case=" + processCase);
// create a new errorURL DB entry
this.crawlQueues.errorURL.push(url, profile,FailCategory.FINAL_PROCESS_CONTEXT,"denied by rule in document, process case="+processCase,-1);
this.crawlQueues.errorURL.push(url,queueEntry.depth(),profile,FailCategory.FINAL_PROCESS_CONTEXT,"denied by rule in document, process case="+processCase,-1);