You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.
yacy_search_server/source/net/yacy/kelondro/index/BinSearch.java

118 lines
4.4 KiB

// BinSearch.java
// -----------------------
// part of The Kelondro Database
// (C) by Michael Peter Christen; mc@yacy.net
// first published on http://www.anomic.de
// Frankfurt, Germany, 2005
// created 22.11.2005
//
// $LastChangedDate$
// $LastChangedRevision$
// $LastChangedBy$
//
// This program is free software; you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation; either version 2 of the License, or
// (at your option) any later version.
//
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with this program; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
package net.yacy.kelondro.index;
import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import java.util.Arrays;
import java.util.List;
import net.yacy.cora.order.ByteOrder;
import net.yacy.kelondro.order.NaturalOrder;
/**
 * Binary search over a flat byte array that holds fixed-size entries ("chunks")
 * stored back to back.
 *
 * <p>Entry {@code i} occupies the bytes {@code [i * chunksize, (i + 1) * chunksize)}
 * of the backing array. Lookups compare entries with {@link #objectOrder}; they
 * only give meaningful results if the entries are stored in ascending order
 * according to that same order.</p>
 */
public final class BinSearch {

    /** Order used for sorting entries and for comparing them during lookup. */
    private static final ByteOrder objectOrder = new NaturalOrder(true); // the natural order is much faster than the b64Order

    /** All entries, concatenated without separators. */
    private final byte[] chunks;

    /** Length of a single entry in bytes. */
    private final int chunksize;

    /** Number of complete entries in {@link #chunks}. */
    private final int count;

    /**
     * Wraps an existing array of concatenated entries.
     *
     * <p>The array is used as-is: it is neither copied nor sorted here, so the
     * caller has to supply the entries already ordered for {@link #contains(byte[])}
     * to work. Trailing bytes that do not form a complete entry are ignored
     * because the entry count is computed by integer division.</p>
     *
     * @param chunks concatenated entries
     * @param chunksize length of one entry in bytes; a value of 0 causes an
     *        {@link ArithmeticException} from the division
     */
    public BinSearch(final byte[] chunks, final int chunksize) {
        this.chunks = chunks;
        this.chunksize = chunksize;
        this.count = chunks.length / chunksize;
    }

    /**
     * Builds the search structure from individual entries.
     *
     * <p>The entries are sorted with {@link #objectOrder} and then copied into
     * one contiguous array; the first {@code chunksize} bytes of every entry
     * are taken. The given list itself is not modified.</p>
     *
     * @param chunkList the entries, each at least {@code chunksize} bytes long
     * @param chunksize length of one entry in bytes
     */
    public BinSearch(final List<byte[]> chunkList, final int chunksize) {
        final byte[][] sorted = chunkList.toArray(new byte[chunkList.size()][]);
        Arrays.sort(sorted, objectOrder);

        this.chunks = new byte[chunkList.size() * chunksize];
        for (int i = 0; i < sorted.length; i++) {
            System.arraycopy(sorted[i], 0, this.chunks, i * chunksize, chunksize);
        }
        this.chunksize = chunksize;
        this.count = this.chunks.length / chunksize;
        assert this.count == chunkList.size();
    }

    /**
     * Tests whether an entry that compares equal to {@code t} is stored.
     *
     * @param t the entry to look for; expected to be exactly {@code chunksize} bytes long
     * @return {@code true} if an equal entry was found, {@code false} otherwise
     */
    public final boolean contains(final byte[] t) {
        return contains(t, 0, this.count);
    }

    /**
     * Binary search for {@code t} within a range of entry indexes.
     *
     * @param t the entry to look for
     * @param beginPos first entry index of the search range (inclusive)
     * @param endPos end of the search range (exclusive)
     * @return {@code true} if an entry comparing equal to {@code t} lies in the range
     */
    private final boolean contains(final byte[] t, int beginPos, int endPos) {
        assert t.length == this.chunksize;
        while (beginPos < endPos) {
            // Computing the midpoint from the range width cannot overflow, unlike
            // (beginPos + endPos) / 2, which turns negative for very large entry
            // counts. The pivot is therefore always inside [beginPos, endPos).
            final int pivot = beginPos + ((endPos - beginPos) >>> 1);
            final int c = objectOrder.compare(this.chunks, pivot * this.chunksize, t, 0, this.chunksize);
            if (c == 0) {
                return true;
            }
            if (c < 0) {
                // stored entry < t: continue in the upper half
                beginPos = pivot + 1;
            } else {
                // stored entry > t: continue in the lower half
                endPos = pivot;
            }
        }
        return false;
    }

    /**
     * @return the number of entries
     */
    public final int size() {
        return this.count;
    }

    /**
     * Returns a copy of one entry in a newly allocated array.
     *
     * @param element index of the entry
     * @return a new array of {@code chunksize} bytes holding the entry
     */
    public final byte[] get(final int element) {
        final byte[] a = new byte[this.chunksize];
        System.arraycopy(this.chunks, element * this.chunksize, a, 0, this.chunksize);
        return a;
    }

    /**
     * Copies one entry into a caller-supplied array, avoiding an allocation.
     *
     * @param element index of the entry
     * @param a target array; expected to be exactly {@code chunksize} bytes long
     * @return the array {@code a} that was passed in
     */
    public final byte[] get(final int element, byte[] a) {
        assert a.length == this.chunksize;
        System.arraycopy(this.chunks, element * this.chunksize, a, 0, this.chunksize);
        return a;
    }

    /**
     * Writes the raw concatenated entries to a file.
     *
     * @param f the file to write to
     * @throws IOException if the file cannot be opened or written
     */
    public final void write(File f) throws IOException {
        final FileOutputStream os = new FileOutputStream(f);
        try {
            os.write(this.chunks);
            os.flush();
        } finally {
            // close even when writing fails, so the file handle is not leaked
            os.close();
        }
    }

    /**
     * Small manual demo: looks up every 6-character entry of a sample string,
     * then the same windows shifted by one character, and prints the result
     * of each lookup.
     *
     * @param args not used
     */
    public static void main(final String[] args) {
        final String s = "4CEvsI8FRczRBo_ApRCkwfEbFLn1pIFXg39QGMgj5RHM6HpIMJq67QX3M5iQYr_LyI_5aGDaa_bYbRgJ9XnQjpmq6QkOoGWAoEaihRqhV3kItLFHjRtqauUR";
        final BinSearch bs = new BinSearch(s.getBytes(), 6);

        // windows aligned with the stored entries
        for (int i = 0; i + 6 <= s.length(); i = i + 6) {
            final String key = s.substring(i, i + 6);
            System.out.println(key + ":" + (bs.contains(key.getBytes()) ? "drin" : "draussen"));
        }

        // windows shifted by one character
        for (int i = 0; i + 7 <= s.length(); i = i + 6) {
            final String key = s.substring(i + 1, i + 7);
            System.out.println(key + ":" + (bs.contains(key.getBytes()) ? "drin" : "draussen"));
        }
    }
}