bugfix in new URL class, better logging for domain extraction

git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@2317 6c8d7289-2bf4-0310-a012-ef5d649a1542
19 years ago · 685430a1b5
parent c57b78722b
commit 685430a1b5
2 changed files with 10 additions and 3 deletions
--- a/source/de/anomic/net/URL.java
+++ b/source/de/anomic/net/URL.java
@@ -55,8 +55,8 @@ public class URL {
                host = url.substring(p + 3);
                userInfo = null;
            } else {
-                host = url.substring(p + 3, r);
-                userInfo = url.substring(r + 1);
+                host = url.substring(r + 1);
+                userInfo = url.substring(p + 3, r);
            }
            path = "/";
        } else {
--- a/source/yacy.java
+++ b/source/yacy.java
@@ -947,6 +947,7 @@ public final class yacy {
            System.out.println("i.e.");
            System.out.println("java -Xms900m -Xmx900m -classpath classes yacy -domlist");
            int c = 0;
+            long start = System.currentTimeMillis();
            while (eiter.hasNext()) {
                try {
                    entry = (plasmaCrawlLURL.Entry) eiter.next();
@@ -956,7 +957,13 @@ public final class yacy {
                    // just ignore
                }
                c++;
-                if (c % 10000 == 0) System.out.println(c + " urls checked, " + doms.size() + " domains collected.");
+                if (c % 10000 == 0) {
+                    System.out.println(
+                            c + " urls checked, " +
+                            doms.size() + " domains collected, " +
+                            Runtime.getRuntime().freeMemory() + " freeMem, " + 
+                            ((System.currentTimeMillis() - start) * (pool.loadedURL.size() - c) / c / 60000) + " minutes remaining.");
+                }
            }