- one try to fix the httpd problem

- fix for handling of collection index that appears when removing elements
- added another navigation method (stub, not working yet)

git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@4543 6c8d7289-2bf4-0310-a012-ef5d649a1542
pull/1/head
orbiter 17 years ago
parent 7cc4ff05c9
commit 9eddc1506b

@ -25,6 +25,7 @@
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA // Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
import java.util.Iterator; import java.util.Iterator;
import java.util.Map;
import java.util.Set; import java.util.Set;
import java.util.TreeSet; import java.util.TreeSet;
@ -36,6 +37,7 @@ import de.anomic.plasma.plasmaSearchQuery;
import de.anomic.plasma.plasmaSwitchboard; import de.anomic.plasma.plasmaSwitchboard;
import de.anomic.server.serverObjects; import de.anomic.server.serverObjects;
import de.anomic.server.serverSwitch; import de.anomic.server.serverSwitch;
import de.anomic.yacy.yacyURL;
public class sidebar_navigation { public class sidebar_navigation {
@ -119,15 +121,34 @@ public class sidebar_navigation {
prop.put("navigation_topwords_words_" + hintcount + "_resource", theQuery.searchdom()); prop.put("navigation_topwords_words_" + hintcount + "_resource", theQuery.searchdom());
prop.put("navigation_topwords_words_" + hintcount + "_zonecode", theQuery.zonecode); prop.put("navigation_topwords_words_" + hintcount + "_zonecode", theQuery.zonecode);
} }
prop.put("navigation_topwords_words", hintcount); hintcount++;
if (hintcount++ > MAX_TOPWORDS) { if (hintcount >= MAX_TOPWORDS) break;
break;
}
} }
prop.put("navigation_topwords_words", hintcount);
prop.put("navigation_topwords", "1"); prop.put("navigation_topwords", "1");
} }
} }
// compose language zone drill-down
int c = 0;
final Iterator<Map.Entry<String, Integer>> iter = theSearch.getRankingResult().getZoneStatistics().entrySet().iterator();
Map.Entry<String, Integer> entry;
while (iter.hasNext()) {
entry = iter.next();
if ((theQuery == null) || (theQuery.queryString == null)) break;
prop.putHTML("navigation_languagezone_zones_" + c + "_zone", entry.getKey() + " (" + entry.getValue() + ")");
prop.putHTML("navigation_languagezone_zones_" + c + "_search", theQuery.queryString.replace(' ', '+'));
prop.put("navigation_languagezone_zones_" + c + "_count", theQuery.displayResults());
prop.put("navigation_languagezone_zones_" + c + "_offset", "0");
prop.put("navigation_languagezone_zones_" + c + "_contentdom", theQuery.contentdom());
prop.put("navigation_languagezone_zones_" + c + "_resource", theQuery.searchdom());
prop.put("navigation_languagezone_zones_" + c + "_zonecode", yacyURL.zone2map.get(entry.getKey()).intValue());
prop.put("navigation_languagezone_zones", c);
c++;
}
prop.put("navigation_languagezone", (c > 2) ? "1" : "0");
// compose page navigation // compose page navigation
StringBuffer resnav = new StringBuffer(); StringBuffer resnav = new StringBuffer();
int thispage = offset / theQuery.displayResults(); int thispage = offset / theQuery.displayResults();

@ -851,7 +851,17 @@ public final class httpdFileHandler {
if (chunkedOut != null) { if (chunkedOut != null) {
chunkedOut.finish(); chunkedOut.finish();
} }
}
// flush all
try {newOut.flush();}catch (Exception e) {}
// wait a little time until everything closes so that clients can read from the streams/sockets
if ((contentLength >= 0) && ((String)requestHeader.get(httpHeader.CONNECTION, "close")).indexOf("keep-alive") == -1) {
// in case that the client knows the size in advance (contentLength present) the waiting will have no effect on the interface performance
// but if the client waits on a connection interruption this will slow down.
try {Thread.sleep(2000);} catch (InterruptedException e) {} // FIXME: is this necessary?
}
}
// check mime type again using the result array: these are 'magics' // check mime type again using the result array: these are 'magics'
// if (serverByteBuffer.equals(result, 1, "PNG".getBytes())) mimeType = mimeTable.getProperty("png","text/html"); // if (serverByteBuffer.equals(result, 1, "PNG".getBytes())) mimeType = mimeTable.getProperty("png","text/html");
@ -921,10 +931,6 @@ public final class httpdFileHandler {
} finally { } finally {
try {out.flush();}catch (Exception e) {} try {out.flush();}catch (Exception e) {}
if (((String)requestHeader.get(httpHeader.CONNECTION, "close")).indexOf("keep-alive") == -1) {
// wait a little time until everything closes so that clients can read from the streams/sockets
try {Thread.sleep(50);} catch (InterruptedException e) {} // FIXME: is this necessary?
}
} }
} }

@ -920,7 +920,7 @@ public class kelondroCollectionIndex {
array_remove( array_remove(
oldPartitionNumber, serialNumber, this.payloadrow.objectsize, oldPartitionNumber, serialNumber, this.payloadrow.objectsize,
oldrownumber); oldrownumber);
index.remove(key, true); index.remove(key, false);
return removed; return removed;
} }

@ -68,6 +68,7 @@ public final class plasmaSearchRankingProcess {
private TreeSet<String> misses; // contains url-hashes that could not been found in the LURL-DB private TreeSet<String> misses; // contains url-hashes that could not been found in the LURL-DB
private plasmaWordIndex wordIndex; private plasmaWordIndex wordIndex;
private HashMap<String, indexContainer>[] localSearchContainerMaps; private HashMap<String, indexContainer>[] localSearchContainerMaps;
private int[] domZones;
public plasmaSearchRankingProcess(plasmaWordIndex wordIndex, plasmaSearchQuery query, int maxentries, int concurrency) { public plasmaSearchRankingProcess(plasmaWordIndex wordIndex, plasmaSearchQuery query, int maxentries, int concurrency) {
// we collect the urlhashes and construct a list with urlEntry objects // we collect the urlhashes and construct a list with urlEntry objects
@ -90,6 +91,8 @@ public final class plasmaSearchRankingProcess {
this.wordIndex = wordIndex; this.wordIndex = wordIndex;
this.flagcount = new int[32]; this.flagcount = new int[32];
for (int i = 0; i < 32; i++) {this.flagcount[i] = 0;} for (int i = 0; i < 32; i++) {this.flagcount[i] = 0;}
this.domZones = new int[8];
for (int i = 0; i < 8; i++) {this.domZones[i] = 0;}
} }
public long ranking(indexRWIVarEntry word) { public long ranking(indexRWIVarEntry word) {
@ -176,6 +179,10 @@ public final class plasmaSearchRankingProcess {
continue; continue;
} }
// count domZones
System.out.println("DEBUG domDomain dom=" + wordIndex.loadedURL.load(iEntry.urlHash, iEntry, 0).comp().url().getHost() + ", zone=" + yacyURL.domDomain(iEntry.urlHash()));
this.domZones[yacyURL.domDomain(iEntry.urlHash())]++;
// insert // insert
if ((maxentries < 0) || (stack.size() < maxentries)) { if ((maxentries < 0) || (stack.size() < maxentries)) {
// in case that we don't have enough yet, accept any new entry // in case that we don't have enough yet, accept any new entry
@ -327,6 +334,10 @@ public final class plasmaSearchRankingProcess {
return this.local_resourceSize; return this.local_resourceSize;
} }
public Map<String, Integer> getZoneStatistics() {
return yacyURL.zoneStatistics(this.domZones);
}
public indexRWIEntry remove(String urlHash) { public indexRWIEntry remove(String urlHash) {
kelondroSortStack<indexRWIVarEntry>.stackElement se = stack.remove(urlHash.hashCode()); kelondroSortStack<indexRWIVarEntry>.stackElement se = stack.remove(urlHash.hashCode());
if (se == null) return null; if (se == null) return null;

@ -31,6 +31,7 @@ import java.io.File;
import java.net.MalformedURLException; import java.net.MalformedURLException;
import java.util.HashMap; import java.util.HashMap;
import java.util.Iterator; import java.util.Iterator;
import java.util.Map;
import java.util.TreeSet; import java.util.TreeSet;
import java.util.regex.Matcher; import java.util.regex.Matcher;
import java.util.regex.Pattern; import java.util.regex.Pattern;
@ -382,7 +383,7 @@ public class yacyURL {
public static final int language_domain_africa_zone = 128 + 32; //{5, 7}; public static final int language_domain_africa_zone = 128 + 32; //{5, 7};
public static final int language_domain_any_zone = 255; public static final int language_domain_any_zone = 255;
public static final String[] regions = {"europe", "english", "spanish", "asia", "middleeast", "africa"}; public static final HashMap<String, Integer> zone2map = new HashMap<String, Integer>();
static { static {
// create a dummy hash // create a dummy hash
@ -398,6 +399,14 @@ public class yacyURL {
insertTLDProps(TLD_Africa, 5); // africa insertTLDProps(TLD_Africa, 5); // africa
insertTLDProps(TLD_Generic, 6); // anything else, mixed languages, mainly english insertTLDProps(TLD_Generic, 6); // anything else, mixed languages, mainly english
// the id=7 is used to flag local addresses // the id=7 is used to flag local addresses
zone2map.put("europe", language_domain_europe_zone);
zone2map.put("english", language_domain_english_zone);
zone2map.put("spanish", language_domain_spanish_zone);
zone2map.put("asia", language_domain_asia_zone);
zone2map.put("middleeast", language_domain_middleeast_zone);
zone2map.put("africa", language_domain_africa_zone);
zone2map.put("any", language_domain_any_zone);
} }
// class variables // class variables
@ -1093,7 +1102,7 @@ public class yacyURL {
// returns the ID of the domain of the domain // returns the ID of the domain of the domain
assert (urlHash != null); assert (urlHash != null);
assert (urlHash.length() == 12) : "urlhash = " + urlHash; assert (urlHash.length() == 12) : "urlhash = " + urlHash;
return (kelondroBase64Order.enhancedCoder.decodeByte(urlHash.charAt(11)) & 12) >> 2; return (kelondroBase64Order.enhancedCoder.decodeByte(urlHash.charAt(11)) & 28) >> 2;
} }
public static boolean isLocalDomain(String urlhash) { public static boolean isLocalDomain(String urlhash) {
@ -1123,6 +1132,26 @@ public class yacyURL {
return language; return language;
} }
public static Map<String, Integer> zoneStatistics(int[] domAccumulators) {
assert domAccumulators.length == 8;
HashMap<String, Integer> zoneCounter = new HashMap<String, Integer>();
Iterator<Map.Entry<String, Integer>> j;
Map.Entry<String, Integer> entry;
for (int i = 0; i < 8; i++) {
j = zone2map.entrySet().iterator();
while (j.hasNext()) {
entry = j.next();
if ((i & entry.getValue().intValue()) != 0) {
if (zoneCounter.containsKey(entry.getKey())) {
zoneCounter.put(entry.getKey(), zoneCounter.get(entry.getKey()) + domAccumulators[i]);
} else {
zoneCounter.put(entry.getKey(), domAccumulators[i]);
}
}
}
}
return zoneCounter;
}
public static void main(String[] args) { public static void main(String[] args) {
String[][] test = new String[][]{ String[][] test = new String[][]{

Loading…
Cancel
Save