- introduced blocking queues in CrawlStacker to make it ready for concurrency
- added a second busy thread for the CrawlStacker
The CrawlStacker is now multithreaded; it will be converted into a BlockingThread in a later step.
Running the stacker concurrently will hopefully solve some problems in cases where DNS lookups block.
git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5395 6c8d7289-2bf4-0310-a012-ef5d649a1542
@ -578,8 +578,10 @@ public final class plasmaSwitchboard extends serverAbstractSwitch<IndexingStack.
deployThread(plasmaSwitchboardConstants.CLEANUP,"Cleanup","simple cleaning process for monitoring information",null,
newserverInstantBusyThread(this,plasmaSwitchboardConstants.CLEANUP_METHOD_START,plasmaSwitchboardConstants.CLEANUP_METHOD_JOBCOUNT,plasmaSwitchboardConstants.CLEANUP_METHOD_FREEMEM),600000);// all 5 Minutes, wait 10 minutes until first run
deployThread(plasmaSwitchboardConstants.CRAWLSTACK,"Crawl URL Stacker","process that checks url for double-occurrences and for allowance/disallowance by robots.txt",null,
deployThread(plasmaSwitchboardConstants.CRAWLSTACK0,"Crawl URL Stacker","process that checks url for double-occurrences and for allowance/disallowance by robots.txt",null,
deployThread(plasmaSwitchboardConstants.CRAWLSTACK1,"Crawl URL Stacker","process that checks url for double-occurrences and for allowance/disallowance by robots.txt",null,
deployThread(plasmaSwitchboardConstants.INDEXER,"Indexing","thread that either initiates a parsing/indexing queue, distributes the index into the DHT, stores parsed documents or flushes the index cache","/IndexCreateIndexingQueue_p.html",
deployThread(plasmaSwitchboardConstants.CRAWLJOB_REMOTE_TRIGGERED_CRAWL,"Remote Crawl Job","thread that performes a single crawl/indexing step triggered by a remote peer",null,
@ -716,6 +718,7 @@ public final class plasmaSwitchboard extends serverAbstractSwitch<IndexingStack.