|
|
@ -1190,7 +1190,6 @@ public final class Switchboard extends serverSwitch
|
|
|
|
|
|
|
|
|
|
|
|
// remove heuristics
|
|
|
|
// remove heuristics
|
|
|
|
setConfig("heuristic.site", false);
|
|
|
|
setConfig("heuristic.site", false);
|
|
|
|
setConfig("heuristic.scroogle", false);
|
|
|
|
|
|
|
|
setConfig("heuristic.blekko", false);
|
|
|
|
setConfig("heuristic.blekko", false);
|
|
|
|
|
|
|
|
|
|
|
|
// relocate
|
|
|
|
// relocate
|
|
|
@ -3152,8 +3151,8 @@ public final class Switchboard extends serverSwitch
|
|
|
|
|
|
|
|
|
|
|
|
final Map<MultiProtocolURI, String> links;
|
|
|
|
final Map<MultiProtocolURI, String> links;
|
|
|
|
searchEvent.getRankingResult().oneFeederStarted();
|
|
|
|
searchEvent.getRankingResult().oneFeederStarted();
|
|
|
|
try {
|
|
|
|
try {
|
|
|
|
links = Switchboard.this.loader.loadLinks(url, CacheStrategy.NOCACHE);
|
|
|
|
links = Switchboard.this.loader.loadLinks(url, CacheStrategy.NOCACHE);
|
|
|
|
if ( links != null ) {
|
|
|
|
if ( links != null ) {
|
|
|
|
final Iterator<MultiProtocolURI> i = links.keySet().iterator();
|
|
|
|
final Iterator<MultiProtocolURI> i = links.keySet().iterator();
|
|
|
|
while ( i.hasNext() ) {
|
|
|
|
while ( i.hasNext() ) {
|
|
|
@ -3166,59 +3165,7 @@ public final class Switchboard extends serverSwitch
|
|
|
|
addAllToIndex(url, links, searchEvent, "site");
|
|
|
|
addAllToIndex(url, links, searchEvent, "site");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} catch ( final Throwable e ) {
|
|
|
|
} catch ( final Throwable e ) {
|
|
|
|
Log.logException(e);
|
|
|
|
Log.logException(e);
|
|
|
|
} finally {
|
|
|
|
|
|
|
|
searchEvent.getRankingResult().oneFeederTerminated();
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
}.start();
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
public final void heuristicScroogle(final SearchEvent searchEvent) {
|
|
|
|
|
|
|
|
new Thread() {
|
|
|
|
|
|
|
|
@Override
|
|
|
|
|
|
|
|
public void run() {
|
|
|
|
|
|
|
|
QueryParams query = searchEvent.getQuery();
|
|
|
|
|
|
|
|
String queryString = query.queryString(true);
|
|
|
|
|
|
|
|
final int meta = queryString.indexOf("heuristic:", 0);
|
|
|
|
|
|
|
|
if ( meta >= 0 ) {
|
|
|
|
|
|
|
|
final int q = queryString.indexOf(' ', meta);
|
|
|
|
|
|
|
|
queryString =
|
|
|
|
|
|
|
|
(q >= 0)
|
|
|
|
|
|
|
|
? queryString.substring(0, meta) + queryString.substring(q + 1)
|
|
|
|
|
|
|
|
: queryString.substring(0, meta);
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
final String urlString =
|
|
|
|
|
|
|
|
"http://www.scroogle.org/cgi-bin/nbbw.cgi?Gw="
|
|
|
|
|
|
|
|
+ queryString.trim().replaceAll(" ", "+")
|
|
|
|
|
|
|
|
+ "&n=2";
|
|
|
|
|
|
|
|
final DigestURI url;
|
|
|
|
|
|
|
|
try {
|
|
|
|
|
|
|
|
url = new DigestURI(MultiProtocolURI.unescape(urlString));
|
|
|
|
|
|
|
|
} catch ( final MalformedURLException e1 ) {
|
|
|
|
|
|
|
|
Log.logWarning("heuristicScroogle", "url not well-formed: '" + urlString + "'");
|
|
|
|
|
|
|
|
return;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
Map<MultiProtocolURI, String> links = null;
|
|
|
|
|
|
|
|
searchEvent.getRankingResult().oneFeederStarted();
|
|
|
|
|
|
|
|
try {
|
|
|
|
|
|
|
|
links = Switchboard.this.loader.loadLinks(url, CacheStrategy.NOCACHE);
|
|
|
|
|
|
|
|
if ( links != null ) {
|
|
|
|
|
|
|
|
final Iterator<MultiProtocolURI> i = links.keySet().iterator();
|
|
|
|
|
|
|
|
while ( i.hasNext() ) {
|
|
|
|
|
|
|
|
if ( i.next().toNormalform(false, false).indexOf("scroogle", 0) >= 0 ) {
|
|
|
|
|
|
|
|
i.remove();
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
Switchboard.this.log.logInfo("Heuristic: adding "
|
|
|
|
|
|
|
|
+ links.size()
|
|
|
|
|
|
|
|
+ " links from scroogle");
|
|
|
|
|
|
|
|
// add all pages to the index
|
|
|
|
|
|
|
|
addAllToIndex(null, links, searchEvent, "scroogle");
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
} catch ( final Throwable e ) {
|
|
|
|
|
|
|
|
//Log.logException(e);
|
|
|
|
|
|
|
|
} finally {
|
|
|
|
} finally {
|
|
|
|
searchEvent.getRankingResult().oneFeederTerminated();
|
|
|
|
searchEvent.getRankingResult().oneFeederTerminated();
|
|
|
|
}
|
|
|
|
}
|
|
|
|