@ -170,7 +170,7 @@ public final class CrawlSwitchboard {
CrawlProfile . getRecrawlDate ( CRAWL_PROFILE_PROXY_RECRAWL_CYCLE ) , - 1 , false ,
true /*getConfigBool(PROXY_INDEXING_LOCAL_TEXT, true)*/ ,
true /*getConfigBool(PROXY_INDEXING_LOCAL_MEDIA, true)*/ ,
true , true ,
true ,
false /*getConfigBool(PROXY_INDEXING_REMOTE, false)*/ , true , true , true ,
CrawlProfile . CacheStrategy . IFFRESH ) ;
this . profilesActiveCrawls . put ( this . defaultProxyProfile . handle ( ) . getBytes ( ) , this . defaultProxyProfile ) ;
@ -178,38 +178,38 @@ public final class CrawlSwitchboard {
if ( this . defaultRemoteProfile = = null ) {
// generate new default entry for remote crawling
this . defaultRemoteProfile = new CrawlProfile ( CRAWL_PROFILE_REMOTE , null , CrawlProfile . MATCH_ALL , CrawlProfile . MATCH_NEVER , 0 ,
- 1 , - 1 , true , true , true , false , true, false, true , true , false , CrawlProfile . CacheStrategy . IFFRESH ) ;
- 1 , - 1 , true , true , true , false , false, true , true , false , CrawlProfile . CacheStrategy . IFFRESH ) ;
this . profilesActiveCrawls . put ( this . defaultRemoteProfile . handle ( ) . getBytes ( ) , this . defaultRemoteProfile ) ;
}
if ( this . defaultTextSnippetLocalProfile = = null ) {
// generate new default entry for snippet fetch and optional crawling
this . defaultTextSnippetLocalProfile = new CrawlProfile ( CRAWL_PROFILE_SNIPPET_LOCAL_TEXT , null , CrawlProfile . MATCH_ALL , CrawlProfile . MATCH_NEVER , 0 ,
CrawlProfile . getRecrawlDate ( CRAWL_PROFILE_SNIPPET_LOCAL_TEXT_RECRAWL_CYCLE ) , - 1 , true , false , false , true , true, false, true , true , false , CrawlProfile . CacheStrategy . IFFRESH ) ;
CrawlProfile . getRecrawlDate ( CRAWL_PROFILE_SNIPPET_LOCAL_TEXT_RECRAWL_CYCLE ) , - 1 , true , false , false , true , false, true , true , false , CrawlProfile . CacheStrategy . IFFRESH ) ;
this . profilesActiveCrawls . put ( this . defaultTextSnippetLocalProfile . handle ( ) . getBytes ( ) , this . defaultTextSnippetLocalProfile ) ;
}
if ( this . defaultTextSnippetGlobalProfile = = null ) {
// generate new default entry for snippet fetch and optional crawling
this . defaultTextSnippetGlobalProfile = new CrawlProfile ( CRAWL_PROFILE_SNIPPET_GLOBAL_TEXT , null , CrawlProfile . MATCH_ALL , CrawlProfile . MATCH_NEVER , 0 ,
CrawlProfile . getRecrawlDate ( CRAWL_PROFILE_SNIPPET_GLOBAL_TEXT_RECRAWL_CYCLE ) , - 1 , true , true , true , true , true, false, true , true , false , CrawlProfile . CacheStrategy . IFEXIST ) ;
CrawlProfile . getRecrawlDate ( CRAWL_PROFILE_SNIPPET_GLOBAL_TEXT_RECRAWL_CYCLE ) , - 1 , true , true , true , true , false, true , true , false , CrawlProfile . CacheStrategy . IFEXIST ) ;
this . profilesActiveCrawls . put ( this . defaultTextSnippetGlobalProfile . handle ( ) . getBytes ( ) , this . defaultTextSnippetGlobalProfile ) ;
}
this . defaultTextSnippetGlobalProfile . setCacheStrategy ( CrawlProfile . CacheStrategy . IFEXIST ) ;
if ( this . defaultMediaSnippetLocalProfile = = null ) {
// generate new default entry for snippet fetch and optional crawling
this . defaultMediaSnippetLocalProfile = new CrawlProfile ( CRAWL_PROFILE_SNIPPET_LOCAL_MEDIA , null , CrawlProfile . MATCH_ALL , CrawlProfile . MATCH_NEVER , 0 ,
CrawlProfile . getRecrawlDate ( CRAWL_PROFILE_SNIPPET_LOCAL_MEDIA_RECRAWL_CYCLE ) , - 1 , true , false , false , true , false , false, true, true , false , CrawlProfile . CacheStrategy . IFEXIST ) ;
CrawlProfile . getRecrawlDate ( CRAWL_PROFILE_SNIPPET_LOCAL_MEDIA_RECRAWL_CYCLE ) , - 1 , true , false , false , true , false , true, true , false , CrawlProfile . CacheStrategy . IFEXIST ) ;
this . profilesActiveCrawls . put ( this . defaultMediaSnippetLocalProfile . handle ( ) . getBytes ( ) , this . defaultMediaSnippetLocalProfile ) ;
}
if ( this . defaultMediaSnippetGlobalProfile = = null ) {
// generate new default entry for snippet fetch and optional crawling
this . defaultMediaSnippetGlobalProfile = new CrawlProfile ( CRAWL_PROFILE_SNIPPET_GLOBAL_MEDIA , null , CrawlProfile . MATCH_ALL , CrawlProfile . MATCH_NEVER , 0 ,
CrawlProfile . getRecrawlDate ( CRAWL_PROFILE_SNIPPET_GLOBAL_MEDIA_RECRAWL_CYCLE ) , - 1 , true , false , true , true , true, false, true , true , false , CrawlProfile . CacheStrategy . IFEXIST ) ;
CrawlProfile . getRecrawlDate ( CRAWL_PROFILE_SNIPPET_GLOBAL_MEDIA_RECRAWL_CYCLE ) , - 1 , true , false , true , true , false, true , true , false , CrawlProfile . CacheStrategy . IFEXIST ) ;
this . profilesActiveCrawls . put ( this . defaultMediaSnippetGlobalProfile . handle ( ) . getBytes ( ) , this . defaultMediaSnippetGlobalProfile ) ;
}
if ( this . defaultSurrogateProfile = = null ) {
// generate new default entry for surrogate parsing
this . defaultSurrogateProfile = new CrawlProfile ( CRAWL_PROFILE_SURROGATE , null , CrawlProfile . MATCH_ALL , CrawlProfile . MATCH_NEVER , 0 ,
CrawlProfile . getRecrawlDate ( CRAWL_PROFILE_SURROGATE_RECRAWL_CYCLE ) , - 1 , true , true , false , false , false , false, true, true , false , CrawlProfile . CacheStrategy . NOCACHE ) ;
CrawlProfile . getRecrawlDate ( CRAWL_PROFILE_SURROGATE_RECRAWL_CYCLE ) , - 1 , true , true , false , false , false , true, true , false , CrawlProfile . CacheStrategy . NOCACHE ) ;
this . profilesActiveCrawls . put ( this . defaultSurrogateProfile . handle ( ) . getBytes ( ) , this . defaultSurrogateProfile ) ;
}
}