git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5588 6c8d7289-2bf4-0310-a012-ef5d649a1542pull/1/head
parent
de610b99ec
commit
6a876ecb88
@ -1,249 +0,0 @@
|
||||
// yacyPeerSelection.java
|
||||
// -------------------------------------
|
||||
// (C) by Michael Peter Christen; mc@yacy.net
|
||||
// first published 05.11.2008 on http://yacy.net
|
||||
// Frankfurt, Germany, 2008
|
||||
//
|
||||
// $LastChangedDate: 2008-09-03 02:30:21 +0200 (Mi, 03 Sep 2008) $
|
||||
// $LastChangedRevision: 5102 $
|
||||
// $LastChangedBy: orbiter $
|
||||
//
|
||||
// This program is free software; you can redistribute it and/or modify
|
||||
// it under the terms of the GNU General Public License as published by
|
||||
// the Free Software Foundation; either version 2 of the License, or
|
||||
// (at your option) any later version.
|
||||
//
|
||||
// This program is distributed in the hope that it will be useful,
|
||||
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
// GNU General Public License for more details.
|
||||
//
|
||||
// You should have received a copy of the GNU General Public License
|
||||
// along with this program; if not, write to the Free Software
|
||||
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
||||
|
||||
package de.anomic.yacy;
|
||||
|
||||
import java.util.HashMap;
|
||||
import java.util.HashSet;
|
||||
import java.util.Iterator;
|
||||
|
||||
import de.anomic.kelondro.order.Base64Order;
|
||||
import de.anomic.kelondro.order.DateFormatter;
|
||||
import de.anomic.kelondro.util.ScoreCluster;
|
||||
import de.anomic.kelondro.util.kelondroException;
|
||||
|
||||
|
||||
/*
|
||||
* this package is a collection of peer selection iterations that had been
|
||||
* part of yacyPeerActions, yacyDHTActions and yacySeedDB
|
||||
*/
|
||||
|
||||
public class yacyPeerSelection {
|
||||
|
||||
public static Iterator<yacySeed> getAcceptRemoteIndexSeeds(yacySeedDB seedDB, final String starthash, int max, boolean alsoMyOwn) {
|
||||
// returns an enumeration of yacySeed-Objects
|
||||
// that have the AcceptRemoteIndex-Flag set
|
||||
// the seeds are enumerated in the right order according DHT
|
||||
return new acceptRemoteIndexSeedEnum(seedDB, starthash, Math.min(max, seedDB.sizeConnected()), alsoMyOwn);
|
||||
}
|
||||
|
||||
private static class acceptRemoteIndexSeedEnum implements Iterator<yacySeed> {
|
||||
|
||||
private Iterator<yacySeed> se;
|
||||
private yacySeed nextSeed;
|
||||
private yacySeedDB seedDB;
|
||||
private HashSet<String> doublecheck;
|
||||
private int remaining;
|
||||
private boolean alsoMyOwn;
|
||||
|
||||
public acceptRemoteIndexSeedEnum(yacySeedDB seedDB, final String starthash, int max, boolean alsoMyOwn) {
|
||||
this.seedDB = seedDB;
|
||||
this.se = getDHTSeeds(seedDB, starthash, yacyVersion.YACY_HANDLES_COLLECTION_INDEX);
|
||||
this.remaining = max;
|
||||
this.doublecheck = new HashSet<String>();
|
||||
this.nextSeed = nextInternal();
|
||||
this.alsoMyOwn = alsoMyOwn && nextSeed != null && (Base64Order.enhancedCoder.compare(seedDB.mySeed().hash.getBytes(), nextSeed.hash.getBytes()) > 0);
|
||||
}
|
||||
|
||||
public boolean hasNext() {
|
||||
return nextSeed != null;
|
||||
}
|
||||
|
||||
private yacySeed nextInternal() {
|
||||
if (this.remaining <= 0) return null;
|
||||
yacySeed s;
|
||||
try {
|
||||
while (se.hasNext()) {
|
||||
s = se.next();
|
||||
if (s == null) return null;
|
||||
if (doublecheck.contains(s.hash)) return null;
|
||||
this.doublecheck.add(s.hash);
|
||||
if (s.getFlagAcceptRemoteIndex()) {
|
||||
this.remaining--;
|
||||
return s;
|
||||
}
|
||||
}
|
||||
} catch (final kelondroException e) {
|
||||
System.out.println("DEBUG acceptRemoteIndexSeedEnum:" + e.getMessage());
|
||||
yacyCore.log.logSevere("database inconsistency (" + e.getMessage() + "), re-set of db.");
|
||||
seedDB.resetActiveTable();
|
||||
return null;
|
||||
}
|
||||
return null;
|
||||
}
|
||||
|
||||
public yacySeed next() {
|
||||
if (alsoMyOwn && Base64Order.enhancedCoder.compare(seedDB.mySeed().hash.getBytes(), nextSeed.hash.getBytes()) < 0) {
|
||||
// take my own seed hash instead the enumeration result
|
||||
alsoMyOwn = false;
|
||||
return seedDB.mySeed();
|
||||
} else {
|
||||
final yacySeed next = nextSeed;
|
||||
nextSeed = nextInternal();
|
||||
return next;
|
||||
}
|
||||
}
|
||||
|
||||
public void remove() {
|
||||
throw new UnsupportedOperationException();
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
public static Iterator<yacySeed> getDHTSeeds(yacySeedDB seedDB, final String firstHash, final float minVersion) {
|
||||
// enumerates seed-type objects: all seeds with starting point in the middle, rotating at the end/beginning
|
||||
return new seedDHTEnum(seedDB, firstHash, minVersion);
|
||||
}
|
||||
|
||||
private static class seedDHTEnum implements Iterator<yacySeed> {
|
||||
|
||||
Iterator<yacySeed> e1, e2;
|
||||
int steps;
|
||||
float minVersion;
|
||||
yacySeedDB seedDB;
|
||||
|
||||
public seedDHTEnum(yacySeedDB seedDB, final String firstHash, final float minVersion) {
|
||||
this.seedDB = seedDB;
|
||||
this.steps = seedDB.sizeConnected();
|
||||
this.minVersion = minVersion;
|
||||
this.e1 = seedDB.seedsConnected(true, false, firstHash, minVersion);
|
||||
this.e2 = null;
|
||||
}
|
||||
|
||||
public boolean hasNext() {
|
||||
return (steps > 0) && ((e2 == null) || (e2.hasNext()));
|
||||
}
|
||||
|
||||
public yacySeed next() {
|
||||
if (steps == 0) return null;
|
||||
steps--;
|
||||
|
||||
if (e1 == null || !e1.hasNext()) {
|
||||
if (e2 == null) {
|
||||
e1 = null;
|
||||
e2 = seedDB.seedsConnected(true, false, null, minVersion);
|
||||
}
|
||||
return e2.next();
|
||||
}
|
||||
|
||||
final yacySeed n = e1.next();
|
||||
if (!(e1.hasNext())) {
|
||||
e1 = null;
|
||||
e2 = seedDB.seedsConnected(true, false, null, minVersion);
|
||||
}
|
||||
return n;
|
||||
}
|
||||
|
||||
public void remove() {
|
||||
throw new UnsupportedOperationException();
|
||||
}
|
||||
}
|
||||
|
||||
public static Iterator<yacySeed> getProvidesRemoteCrawlURLs(yacySeedDB seedDB) {
|
||||
return new providesRemoteCrawlURLsEnum(seedDB);
|
||||
}
|
||||
|
||||
private static class providesRemoteCrawlURLsEnum implements Iterator<yacySeed> {
|
||||
|
||||
Iterator<yacySeed> se;
|
||||
yacySeed nextSeed;
|
||||
yacySeedDB seedDB;
|
||||
|
||||
public providesRemoteCrawlURLsEnum(yacySeedDB seedDB) {
|
||||
this.seedDB = seedDB;
|
||||
se = getDHTSeeds(seedDB, null, yacyVersion.YACY_POVIDES_REMOTECRAWL_LISTS);
|
||||
nextSeed = nextInternal();
|
||||
}
|
||||
|
||||
public boolean hasNext() {
|
||||
return nextSeed != null;
|
||||
}
|
||||
|
||||
private yacySeed nextInternal() {
|
||||
yacySeed s;
|
||||
try {
|
||||
while (se.hasNext()) {
|
||||
s = se.next();
|
||||
if (s == null) return null;
|
||||
if (s.getLong(yacySeed.RCOUNT, 0) > 0) return s;
|
||||
}
|
||||
} catch (final kelondroException e) {
|
||||
System.out.println("DEBUG providesRemoteCrawlURLsEnum:" + e.getMessage());
|
||||
yacyCore.log.logSevere("database inconsistency (" + e.getMessage() + "), re-set of db.");
|
||||
seedDB.resetActiveTable();
|
||||
return null;
|
||||
}
|
||||
return null;
|
||||
}
|
||||
|
||||
public yacySeed next() {
|
||||
final yacySeed next = nextSeed;
|
||||
nextSeed = nextInternal();
|
||||
return next;
|
||||
}
|
||||
|
||||
public void remove() {
|
||||
throw new UnsupportedOperationException();
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
public static HashMap<String, yacySeed> seedsByAge(yacySeedDB seedDB, final boolean up, int count) {
|
||||
// returns a peerhash/yacySeed relation
|
||||
// to get most recent peers, set up = true; for oldest peers, set up = false
|
||||
|
||||
if (count > seedDB.sizeConnected()) count = seedDB.sizeConnected();
|
||||
|
||||
// fill a score object
|
||||
final ScoreCluster<String> seedScore = new ScoreCluster<String>();
|
||||
yacySeed ys;
|
||||
long absage;
|
||||
final Iterator<yacySeed> s = seedDB.seedsConnected(true, false, null, (float) 0.0);
|
||||
int searchcount = 1000;
|
||||
if (searchcount > seedDB.sizeConnected()) searchcount = seedDB.sizeConnected();
|
||||
try {
|
||||
while ((s.hasNext()) && (searchcount-- > 0)) {
|
||||
ys = s.next();
|
||||
if ((ys != null) && (ys.get(yacySeed.LASTSEEN, "").length() > 10)) try {
|
||||
absage = Math.abs(System.currentTimeMillis() + DateFormatter.dayMillis - ys.getLastSeenUTC());
|
||||
seedScore.addScore(ys.hash, (int) absage); // the higher absage, the older is the peer
|
||||
} catch (final Exception e) {}
|
||||
}
|
||||
|
||||
// result is now in the score object; create a result vector
|
||||
final HashMap<String, yacySeed> result = new HashMap<String, yacySeed>();
|
||||
final Iterator<String> it = seedScore.scores(up);
|
||||
int c = 0;
|
||||
while ((c < count) && (it.hasNext())) {
|
||||
c++;
|
||||
ys = seedDB.getConnected(it.next());
|
||||
if ((ys != null) && (ys.hash != null)) result.put(ys.hash, ys);
|
||||
}
|
||||
return result;
|
||||
} catch (final kelondroException e) {
|
||||
yacyCore.log.logSevere("Internal Error at yacySeedDB.seedsByAge: " + e.getMessage(), e);
|
||||
return null;
|
||||
}
|
||||
}
|
||||
}
|
Loading…
Reference in new issue