You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
yacy_search_server/htroot/WatchCrawler_p.html

187 lines
7.2 KiB

<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
  <!-- Page title, the shared meta tags pulled in by the template include,
       and the four script files this page loads. -->
  <title>YaCy Watch Crawler</title>
  #%env/templates/metas.template%#
  <!-- NOTE(review): WatchCrawler.js is loaded last; presumably it relies on the
       helper scripts listed before it, so keep this order unless confirmed otherwise. -->
  <script type="text/javascript" src="/js/ajax.js"></script>
  <script type="text/javascript" src="/js/xml.js"></script>
  <script type="text/javascript" src="/js/html.js"></script>
  <script type="text/javascript" src="/js/WatchCrawler.js"></script>
</head>
<body>
#%env/templates/header.template%#
<!-- Page heading followed by the refresh countdown. The nextUpdate span is empty
     in the template and calls changeInterval() when clicked; presumably both the
     countdown value and that function come from /js/WatchCrawler.js (TODO confirm). -->
<h2>Crawler Monitor</h2>
<p>Next update in <span id="nextUpdate" onclick="changeInterval()"></span> seconds.</p>
<!-- Status overview. An outer layout table holds three data tables in its first
     row (queues, databases, indicators) and the crawl start message in its second
     row. The spans carrying ids contain only placeholder spaces in the template;
     presumably a page script fills them in through those ids (TODO confirm).
     The layout table is a direct child of the body because XHTML 1.0 Strict does
     not permit a table inside a paragraph. -->
<table border="0" cellpadding="0" cellspacing="0">
  <tr>
    <!-- Queue sizes. This cell spans both layout rows. -->
    <td valign="top" rowspan="2">
      <table border="0" cellpadding="2" cellspacing="1">
        <tbody>
          <tr class="TableHeader">
            <th>Queue</th>
            <th>Size</th>
            <th>Max</th>
          </tr>
          <tr class="TableCellLight">
            <td align="left">Indexing</td>
            <td align="right"><span id="indexingqueuesize">&nbsp;&nbsp;&nbsp;</span></td>
            <td align="right"><span id="indexingqueuemax">&nbsp;&nbsp;&nbsp;</span></td>
          </tr>
          <tr class="TableCellLight">
            <td align="left">Loader</td>
            <td align="right"><span id="loaderqueuesize">&nbsp;&nbsp;&nbsp;</span></td>
            <td align="right"><span id="loaderqueuemax">&nbsp;&nbsp;&nbsp;</span></td>
          </tr>
          <tr class="TableCellLight">
            <td align="left">Local Crawler</td>
            <td align="right"><span id="localcrawlerqueuesize">&nbsp;&nbsp;&nbsp;</span></td>
            <td align="right">unlimited</td>
          </tr>
          <tr class="TableCellLight">
            <td align="left">Remote Crawler</td>
            <td align="right"><span id="remotecrawlerqueuesize">&nbsp;&nbsp;&nbsp;</span></td>
            <td align="right">unlimited</td>
          </tr>
        </tbody>
      </table>
    </td>
    <td width="6">&nbsp;</td>
    <!-- Database entry counts. -->
    <td valign="top">
      <table border="0" cellpadding="2" cellspacing="1">
        <tbody>
          <tr class="TableHeader">
            <th>Database</th>
            <th>Entries</th>
          </tr>
          <tr class="TableCellLight">
            <td align="left">Pages (URLs)</td>
            <td align="right"><span id="urldbsize">&nbsp;&nbsp;&nbsp;</span></td>
          </tr>
          <tr class="TableCellLight">
            <td align="left">RWIs (Words)</td>
            <td align="right"><span id="rwidbsize">&nbsp;&nbsp;&nbsp;</span></td>
          </tr>
        </tbody>
      </table>
    </td>
    <td width="6">&nbsp;</td>
    <!-- Indicators. Each row has a Num span and a Span span under the two-column Level header. -->
    <td valign="top">
      <table border="0" cellpadding="2" cellspacing="1">
        <tbody>
          <tr class="TableHeader">
            <th>Indicator</th>
            <th colspan="2">Level</th>
          </tr>
          <tr class="TableCellLight">
            <td align="left">PPM (Pages Per Minute)</td>
            <td align="left"><span id="ppmNum">&nbsp;&nbsp;&nbsp;</span></td>
            <td align="left"><span id="ppmSpan">&nbsp;&nbsp;&nbsp;</span></td>
          </tr>
          <tr class="TableCellLight">
            <td align="left">RWI RAM (Word Cache)</td>
            <td align="left"><span id="wordcacheNum">&nbsp;</span></td>
            <td align="left"><span id="wordcacheSpan">&nbsp;</span></td>
          </tr>
        </tbody>
      </table>
    </td>
  </tr>
  <tr>
    <!-- Second layout row: the first column is still occupied by the queue cell
         above, so this row starts with a spacer and then spans the remaining
         three columns. -->
    <td width="6">&nbsp;</td>
    <td colspan="3">
      <p>
      <!-- Numbered alternatives of the info switch; alternative 0 is empty.
           Presumably the servlet selects exactly one of them (TODO confirm). -->
      #(info)#<!-- 0 -->
      ::<!-- 1 -->
      Error with profile management. Please stop YaCy, delete the file DATA/PLASMADB/crawlProfiles0.db and restart.
      ::<!-- 2 -->
      Error: #[errmsg]#
      ::<!-- 3 -->
      Application not yet initialized. Sorry. Please wait some seconds and repeat the request.
      ::<!-- 4 -->
      <strong>ERROR: Crawl filter "#[newcrawlingfilter]#" does not match with crawl root "#[crawlingStart]#".</strong> Please try again with different filter.
      ::<!-- 5 -->
      Crawling of "#[crawlingURL]#" failed. Reason: #[reasonString]#<br />
      ::<!-- 6 -->
      Error with URL input "#[crawlingStart]#": #[error]#
      ::<!-- 7 -->
      Error with file input "#[crawlingStart]#": #[error]#
      ::<!-- 8 -->
      Crawling of "#[crawlingURL]#" started.
      <strong>Please wait some seconds, it may take some seconds until the first result appears there.</strong>
      If you crawl any un-wanted pages, you can delete them <a href="IndexCreateWWWLocalQueue_p.html">here</a>.<br />
      #(/info)#
      </p>
    </td>
  </tr>
</table>
<!-- crawl profile list -->
<!-- The heading paragraph ends before the table because XHTML 1.0 Strict does not
     permit a table inside a paragraph. One table row is emitted per entry of the
     crawlProfiles loop. -->
<p id="crawlingProfiles"><strong>Crawl Profiles:</strong><br /></p>
<table border="0" cellpadding="2" cellspacing="1">
  <!-- NOTE(review): this colgroup declares 12 columns while every row has 14 cells,
       so the last two columns (Remote Indexing and the delete button) get no
       explicit width. Confirm whether that is intended. -->
  <colgroup>
    <col width="120" />
    <col />
    <col width="16" />
    <col width="60" />
    <col width="10" span="2" />
    <col />
    <col width="10" span="5" />
  </colgroup>
  <tr class="TableHeader">
    <td><strong>Crawl Thread</strong></td>
    <td><strong>Start URL</strong></td>
    <td><strong>Depth</strong></td>
    <td><strong>Filter</strong></td>
    <td><strong>MaxAge</strong></td>
    <td><strong>Auto Filter Depth</strong></td>
    <td><strong>Auto Filter Content</strong></td>
    <td><strong>Max Page Per Domain</strong></td>
    <td><strong>Accept '?' URLs</strong></td>
    <td><strong>Fill Proxy Cache</strong></td>
    <td><strong>Local Text Indexing</strong></td>
    <td><strong>Local Media Indexing</strong></td>
    <td><strong>Remote Indexing</strong></td>
    <td></td>
  </tr>
  <!-- NOTE(review): the delete form in the last cell submits with GET, for which
       the multipart enctype has no effect. Switching this state-changing request
       to POST should be considered once the servlet is confirmed to accept it. -->
  #{crawlProfiles}#
  <tr class="TableCell#(dark)#Light::Dark#(/dark)#">
    <td>#[name]#</td>
    <td><a href="#[startURL]#">#[startURL]#</a></td>
    <td>#[depth]#</td>
    <td>#[filter]#</td>
    <td>#[crawlingIfOlder]#</td>
    <td>#[crawlingDomFilterDepth]#</td>
    <td>#[crawlingDomFilterContent]#</td>
    <td>#[crawlingDomMaxPages]#</td>
    <td>#(withQuery)#no::yes#(/withQuery)#</td>
    <td>#(storeCache)#no::yes#(/storeCache)#</td>
    <td>#(indexText)#no::yes#(/indexText)#</td>
    <td>#(indexMedia)#no::yes#(/indexMedia)#</td>
    <td>#(remoteIndexing)#no::yes#(/remoteIndexing)#</td>
    <td>#(deleteButton)#::<form action="WatchCrawler_p.html" method="get" enctype="multipart/form-data"><input type="hidden" name="handle" value="#[handle]#" /><input type="submit" name="deleteprofile" value="Delete" /></form>#(/deleteButton)#</td>
  </tr>
  #{/crawlProfiles}#
</table>
<!-- crawl queues -->
<!-- Heading paragraph followed by the queue table. The paragraph ends before the
     table because XHTML 1.0 Strict does not permit a table inside a paragraph.
     The template supplies only the header row; presumably a page script appends
     the queue entries to queueTable (TODO confirm). -->
<p id="crawlingQueues"><strong>Crawl Queue:</strong><br /></p>
<table border="0" cellpadding="2" cellspacing="1" id="queueTable">
  <tbody>
    <tr class="TableHeader">
      <th>Queue</th>
      <th>Profile</th>
      <th>Initiator</th>
      <th>Depth</th>
      <th>Modified Date</th>
      <th>Anchor Name</th>
      <th>URL</th>
      <th>Size</th>
      <th>Delete</th>
    </tr>
  </tbody>
</table>
#%env/templates/footer.template%#
</body>
</html>