bugfix in new URL class, better logging for domain extraction

git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@2317 6c8d7289-2bf4-0310-a012-ef5d649a1542
pull/1/head
orbiter 19 years ago
parent c57b78722b
commit 685430a1b5

@ -55,8 +55,8 @@ public class URL {
host = url.substring(p + 3);
userInfo = null;
} else {
host = url.substring(p + 3, r);
userInfo = url.substring(r + 1);
host = url.substring(r + 1);
userInfo = url.substring(p + 3, r);
}
path = "/";
} else {

@ -947,6 +947,7 @@ public final class yacy {
System.out.println("i.e.");
System.out.println("java -Xms900m -Xmx900m -classpath classes yacy -domlist");
int c = 0;
long start = System.currentTimeMillis();
while (eiter.hasNext()) {
try {
entry = (plasmaCrawlLURL.Entry) eiter.next();
@ -956,7 +957,13 @@ public final class yacy {
// just ignore
}
c++;
if (c % 10000 == 0) System.out.println(c + " urls checked, " + doms.size() + " domains collected.");
if (c % 10000 == 0) {
System.out.println(
c + " urls checked, " +
doms.size() + " domains collected, " +
Runtime.getRuntime().freeMemory() + " freeMem, " +
((System.currentTimeMillis() - start) * (pool.loadedURL.size() - c) / c / 60000) + " minutes remaining.");
}
}

Loading…
Cancel
Save