- added and removed some debugging output

- fixed a bug with merge method
- patched wrong output of language identification (not fixed, only patched!)

git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5181 6c8d7289-2bf4-0310-a012-ef5d649a1542
pull/1/head
orbiter 17 years ago
parent ce2a7ed116
commit e1f67262f7

@ -365,7 +365,7 @@ public class Balancer {
public synchronized void push(final CrawlEntry entry) throws IOException { public synchronized void push(final CrawlEntry entry) throws IOException {
assert entry != null; assert entry != null;
if (urlFileIndex.has(entry.url().hash().getBytes())) { if (urlFileIndex.has(entry.url().hash().getBytes())) {
serverLog.logWarning("PLASMA BALANCER", "double-check has failed for urlhash " + entry.url().hash() + " in " + stackname + " - fixed"); serverLog.logWarning("BALANCER", "double-check has failed for urlhash " + entry.url().hash() + " in " + stackname + " - fixed");
return; return;
} }
@ -534,7 +534,7 @@ public class Balancer {
// emergency case: this means that something with the stack organization is wrong // emergency case: this means that something with the stack organization is wrong
// the file appears to be broken. We kill the file. // the file appears to be broken. We kill the file.
kelondroStack.reset(urlFileStack); kelondroStack.reset(urlFileStack);
serverLog.logSevere("PLASMA BALANCER", "get() failed to fetch entry from file stack. reset stack file."); serverLog.logSevere("BALANCER", "get() failed to fetch entry from file stack. reset stack file.");
} else { } else {
final String nexthash = new String(nextentry.getColBytes(0)); final String nexthash = new String(nextentry.getColBytes(0));
@ -554,7 +554,7 @@ public class Balancer {
// check case where we did not found anything // check case where we did not found anything
if (result == null) { if (result == null) {
serverLog.logSevere("PLASMA BALANCER", "get() was not able to find a valid urlhash - total size = " + size() + ", fileStack.size() = " + urlFileStack.size() + ", ramStack.size() = " + urlRAMStack.size() + ", domainStacks.size() = " + domainStacks.size()); serverLog.logSevere("BALANCER", "get() was not able to find a valid urlhash - total size = " + size() + ", fileStack.size() = " + urlFileStack.size() + ", ramStack.size() = " + urlRAMStack.size() + ", domainStacks.size() = " + domainStacks.size());
return null; return null;
} }
@ -573,7 +573,7 @@ public class Balancer {
// in best case, this should never happen if the balancer works propertly // in best case, this should never happen if the balancer works propertly
// this is only to protection against the worst case, where the crawler could // this is only to protection against the worst case, where the crawler could
// behave in a DoS-manner // behave in a DoS-manner
serverLog.logInfo("PLASMA BALANCER", "forcing fetch delay of " + sleeptime + " millisecond for " + crawlEntry.url().getHost()); serverLog.logInfo("BALANCER", "forcing fetch delay of " + sleeptime + " millisecond for " + crawlEntry.url().getHost());
try {synchronized(this) { this.wait(sleeptime); }} catch (final InterruptedException e) {} try {synchronized(this) { this.wait(sleeptime); }} catch (final InterruptedException e) {}
} }

@ -39,6 +39,7 @@ import java.util.TreeSet;
import de.anomic.kelondro.kelondroRow.Entry; import de.anomic.kelondro.kelondroRow.Entry;
import de.anomic.server.serverMemory; import de.anomic.server.serverMemory;
import de.anomic.server.logging.serverLog;
/* /*
* The EcoIndex builds upon the EcoFS and tries to reduce the number of IO requests that the * The EcoIndex builds upon the EcoFS and tries to reduce the number of IO requests that the
@ -106,21 +107,21 @@ public class kelondroEcoTable implements kelondroIndex {
((useTailCache == tailCacheForceUsage) || ((useTailCache == tailCacheForceUsage) ||
((useTailCache == tailCacheUsageAuto) && (serverMemory.free() > neededRAM4table + 200 * 1024 * 1024)))) ? ((useTailCache == tailCacheUsageAuto) && (serverMemory.free() > neededRAM4table + 200 * 1024 * 1024)))) ?
new kelondroRowSet(taildef, records) : null; new kelondroRowSet(taildef, records) : null;
System.out.println("*** DEBUG " + tablefile + ": available RAM: " + (serverMemory.available() / 1024 / 1024) + "MB, allocating space for " + records + " entries"); serverLog.logInfo("ECOTABLE", "initialization of " + tablefile + ": available RAM: " + (serverMemory.available() / 1024 / 1024) + "MB, allocating space for " + records + " entries");
final long neededRAM4index = 2 * 1024 * 1024 + records * (rowdef.primaryKeyLength + 4) * 3 / 2; final long neededRAM4index = 2 * 1024 * 1024 + records * (rowdef.primaryKeyLength + 4) * 3 / 2;
if (!serverMemory.request(neededRAM4index, false)) { if (!serverMemory.request(neededRAM4index, false)) {
// despite calculations seemed to show that there is enough memory for the table AND the index // despite calculations seemed to show that there is enough memory for the table AND the index
// there is now not enough memory left for the index. So delete the table again to free the memory // there is now not enough memory left for the index. So delete the table again to free the memory
// for the index // for the index
System.out.println("*** DEBUG " + tablefile + ": not enough RAM (" + (serverMemory.available() / 1024 / 1024) + "MB) left for index, deleting allocated table space to enable index space allocation (needed: " + (neededRAM4index / 1024 / 1024) + "MB)"); serverLog.logSevere("ECOTABLE", tablefile + ": not enough RAM (" + (serverMemory.available() / 1024 / 1024) + "MB) left for index, deleting allocated table space to enable index space allocation (needed: " + (neededRAM4index / 1024 / 1024) + "MB)");
table = null; System.gc(); table = null; System.gc();
System.out.println("*** DEBUG " + tablefile + ": RAM after releasing the table: " + (serverMemory.available() / 1024 / 1024) + "MB"); serverLog.logSevere("ECOTABLE", tablefile + ": RAM after releasing the table: " + (serverMemory.available() / 1024 / 1024) + "MB");
} }
index = new kelondroBytesIntMap(rowdef.primaryKeyLength, rowdef.objectOrder, records); index = new kelondroBytesIntMap(rowdef.primaryKeyLength, rowdef.objectOrder, records);
System.out.println("*** DEBUG " + tablefile + ": EcoTable " + tablefile.toString() + " has table copy " + ((table == null) ? "DISABLED" : "ENABLED")); serverLog.logInfo("ECOTABLE", tablefile + ": EcoTable " + tablefile.toString() + " has table copy " + ((table == null) ? "DISABLED" : "ENABLED"));
// read all elements from the file into the copy table // read all elements from the file into the copy table
System.out.print("*** initializing RAM index for EcoTable " + tablefile.getName() + ":"); serverLog.logInfo("ECOTABLE", "initializing RAM index for EcoTable " + tablefile.getName() + ", please wait.");
int i = 0; int i = 0;
byte[] key; byte[] key;
if (table == null) { if (table == null) {
@ -133,11 +134,12 @@ public class kelondroEcoTable implements kelondroIndex {
if (key == null) {i++; continue;} if (key == null) {i++; continue;}
if (!index.addi(key, i++)) fail++; if (!index.addi(key, i++)) fail++;
assert index.size() + fail == i : "index.size() = " + index.size() + ", i = " + i + ", fail = " + fail + ", key = '" + new String(key) + "'"; assert index.size() + fail == i : "index.size() = " + index.size() + ", i = " + i + ", fail = " + fail + ", key = '" + new String(key) + "'";
/*
if ((i % 10000) == 0) { if ((i % 10000) == 0) {
System.out.print('.'); System.out.print('.');
System.out.flush(); System.out.flush();
} }
*/
} }
} else { } else {
byte[] record; byte[] record;
@ -154,23 +156,24 @@ public class kelondroEcoTable implements kelondroIndex {
// write the tail into the table // write the tail into the table
table.addUnique(taildef.newEntry(record, rowdef.primaryKeyLength, true)); table.addUnique(taildef.newEntry(record, rowdef.primaryKeyLength, true));
/*
if ((i % 10000) == 0) { if ((i % 10000) == 0) {
System.out.print('.'); System.out.print('.');
System.out.flush(); System.out.flush();
} }
*/
} }
} }
// check consistency // check consistency
System.out.print(" -ordering- .."); //System.out.print(" -ordering- ..");
System.out.flush(); //System.out.flush();
this.file = new kelondroBufferedEcoFS(new kelondroEcoFS(tablefile, rowdef.objectsize), this.buffersize); this.file = new kelondroBufferedEcoFS(new kelondroEcoFS(tablefile, rowdef.objectsize), this.buffersize);
final ArrayList<Integer[]> doubles = index.removeDoubles(); final ArrayList<Integer[]> doubles = index.removeDoubles();
//assert index.size() + doubles.size() + fail == i; //assert index.size() + doubles.size() + fail == i;
System.out.println(" -removed " + doubles.size() + " doubles- done."); //System.out.println(" -removed " + doubles.size() + " doubles- done.");
if (doubles.size() > 0) { if (doubles.size() > 0) {
System.out.println("DEBUG " + tablefile + ": WARNING - EcoTable " + tablefile + " has " + doubles.size() + " doubles"); serverLog.logInfo("ECOTABLE", tablefile + ": WARNING - EcoTable " + tablefile + " has " + doubles.size() + " doubles");
// from all the doubles take one, put it back to the index and remove the others from the file // from all the doubles take one, put it back to the index and remove the others from the file
// first put back one element each // first put back one element each
final byte[] record = new byte[rowdef.objectsize]; final byte[] record = new byte[rowdef.objectsize];

@ -142,16 +142,21 @@ public class kelondroMergeIterator<E> implements kelondroCloneableIterator<E> {
final Class<?> c = Class.forName("de.anomic.kelondro.kelondroMergeIterator"); final Class<?> c = Class.forName("de.anomic.kelondro.kelondroMergeIterator");
meth = c.getMethod("mergeEqualByReplace", new Class[]{Object.class, Object.class}); meth = c.getMethod("mergeEqualByReplace", new Class[]{Object.class, Object.class});
} catch (final SecurityException e) { } catch (final SecurityException e) {
System.out.println("Error while initializing simpleMerge: " + e.getMessage()); System.out.println("Error while initializing simpleMerge (1): " + e.getMessage());
meth = null; meth = null;
} catch (final ClassNotFoundException e) { } catch (final ClassNotFoundException e) {
System.out.println("Error while initializing simpleMerge: " + e.getMessage()); System.out.println("Error while initializing simpleMerge (2): " + e.getMessage());
meth = null; meth = null;
} catch (final NoSuchMethodException e) { } catch (final NoSuchMethodException e) {
System.out.println("Error while initializing simpleMerge: " + e.getMessage()); System.out.println("Error while initializing simpleMerge (3): " + e.getMessage());
meth = null; meth = null;
} }
simpleMerge = meth; simpleMerge = meth;
} }
// do not remove the following method, it is not reference anywhere directly but indirectly using reflection
// please see initialization of simpleMerge above
public static Object mergeEqualByReplace(final Object a, final Object b) {
return a;
}
} }

@ -824,6 +824,7 @@ public final class plasmaWordIndex implements indexRI {
language = entry.url().language(); language = entry.url().language();
} else { } else {
System.out.println("*** DEBUG LANGUAGE: identification of " + entry.url() + " SUCCESS: " + language); System.out.println("*** DEBUG LANGUAGE: identification of " + entry.url() + " SUCCESS: " + language);
if (language.equals("pl")) language = entry.url().language(); // patch a bug TODO: remove this if bug is fixed
} }
// create a new loaded URL db entry // create a new loaded URL db entry

@ -50,7 +50,9 @@ public class serverMemory {
final long elapsed = System.currentTimeMillis() - lastGC; final long elapsed = System.currentTimeMillis() - lastGC;
if (elapsed > last) { if (elapsed > last) {
final long free = free(); final long free = free();
System.out.println("vvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvv");
System.gc(); System.gc();
System.out.println("^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ if you see this many times please report to forum");
lastGC = System.currentTimeMillis(); lastGC = System.currentTimeMillis();
if (log.isFine()) log.logInfo("[gc] before: " + bytesToString(free) + ", after: " + bytesToString(free()) + ", call: " + info); if (log.isFine()) log.logInfo("[gc] before: " + bytesToString(free) + ", after: " + bytesToString(free()) + ", call: " + info);
} else if (log.isFine()) { } else if (log.isFine()) {

Loading…
Cancel
Save