@ -174,7 +174,7 @@ public class CrawlQueues {
// move some tasks to the core crawl job so we have something to do
final int toshift = Math . min ( 10 , limitCrawlJobSize ( ) ) ; // this cannot be a big number because the balancer makes a forced waiting if it cannot balance
for ( int i = 0 ; i < toshift ; i + + ) {
noticeURL . shift ( NoticedURL . STACK_TYPE_LIMIT , NoticedURL . STACK_TYPE_CORE );
noticeURL . shift ( NoticedURL . STACK_TYPE_LIMIT , NoticedURL . STACK_TYPE_CORE , sb . webIndex . profilesActiveCrawls );
}
log . logInfo ( "shifted " + toshift + " jobs from global crawl to local crawl (coreCrawlJobSize()=" + coreCrawlJobSize ( ) +
", limitCrawlJobSize()=" + limitCrawlJobSize ( ) + ", cluster.mode=" + sb . getConfig ( plasmaSwitchboardConstants . CLUSTER_MODE , "" ) +
@ -214,7 +214,7 @@ public class CrawlQueues {
while ( urlEntry = = null & & noticeURL . stackSize ( NoticedURL . STACK_TYPE_CORE ) > 0 ) {
final String stats = "LOCALCRAWL[" + noticeURL . stackSize ( NoticedURL . STACK_TYPE_CORE ) + ", " + noticeURL . stackSize ( NoticedURL . STACK_TYPE_LIMIT ) + ", " + noticeURL . stackSize ( NoticedURL . STACK_TYPE_OVERHANG ) + ", " + noticeURL . stackSize ( NoticedURL . STACK_TYPE_REMOTE ) + "]" ;
try {
urlEntry = noticeURL . pop ( NoticedURL . STACK_TYPE_CORE , true );
urlEntry = noticeURL . pop ( NoticedURL . STACK_TYPE_CORE , true , sb . webIndex . profilesActiveCrawls );
final String profileHandle = urlEntry . profileHandle ( ) ;
// System.out.println("DEBUG plasmaSwitchboard.processCrawling:
// profileHandle = " + profileHandle + ", urlEntry.url = " + urlEntry.url());
@ -224,7 +224,7 @@ public class CrawlQueues {
}
final CrawlProfile . entry profile = sb . webIndex . profilesActiveCrawls . getEntry ( profileHandle ) ;
if ( profile = = null ) {
log . logWarning ( stats + ": LOST PROFILE HANDLE '" + urlEntry . profileHandle ( ) + "' for URL " + urlEntry . url ( ) ) ;
log . logWarning ( stats + ": LOST LOCALCRAWL PROFILE HANDLE '" + urlEntry . profileHandle ( ) + "' for URL " + urlEntry . url ( ) ) ;
return true ;
}
@ -421,7 +421,7 @@ public class CrawlQueues {
final String stats = "REMOTETRIGGEREDCRAWL[" + noticeURL . stackSize ( NoticedURL . STACK_TYPE_CORE ) + ", " + noticeURL . stackSize ( NoticedURL . STACK_TYPE_LIMIT ) + ", " + noticeURL . stackSize ( NoticedURL . STACK_TYPE_OVERHANG ) + ", "
+ noticeURL . stackSize ( NoticedURL . STACK_TYPE_REMOTE ) + "]" ;
try {
final CrawlEntry urlEntry = noticeURL . pop ( NoticedURL . STACK_TYPE_REMOTE , true );
final CrawlEntry urlEntry = noticeURL . pop ( NoticedURL . STACK_TYPE_REMOTE , true , sb . webIndex . profilesActiveCrawls );
final String profileHandle = urlEntry . profileHandle ( ) ;
// System.out.println("DEBUG plasmaSwitchboard.processCrawling:
// profileHandle = " + profileHandle + ", urlEntry.url = " +
@ -429,7 +429,7 @@ public class CrawlQueues {
final CrawlProfile . entry profile = sb . webIndex . profilesActiveCrawls . getEntry ( profileHandle ) ;
if ( profile = = null ) {
log . logWarning ( stats + ": LOST PROFILE HANDLE '" + urlEntry . profileHandle ( ) + "' for URL " + urlEntry . url ( ) ) ;
log . logWarning ( stats + ": LOST REMOTETRIGGEREDCRAWL PROFILE HANDLE '" + urlEntry . profileHandle ( ) + "' for URL " + urlEntry . url ( ) ) ;
return false ;
}