parent
000dde9511
commit
dd7782bac0
@ -0,0 +1,117 @@
|
|||||||
|
// BinSearch.java
|
||||||
|
// -----------------------
|
||||||
|
// part of The Kelondro Database
|
||||||
|
// (C) by Michael Peter Christen; mc@yacy.net
|
||||||
|
// first published on http://www.anomic.de
|
||||||
|
// Frankfurt, Germany, 2005
|
||||||
|
// created 22.11.2005
|
||||||
|
//
|
||||||
|
// $LastChangedDate$
|
||||||
|
// $LastChangedRevision$
|
||||||
|
// $LastChangedBy$
|
||||||
|
//
|
||||||
|
// This program is free software; you can redistribute it and/or modify
|
||||||
|
// it under the terms of the GNU General Public License as published by
|
||||||
|
// the Free Software Foundation; either version 2 of the License, or
|
||||||
|
// (at your option) any later version.
|
||||||
|
//
|
||||||
|
// This program is distributed in the hope that it will be useful,
|
||||||
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
// GNU General Public License for more details.
|
||||||
|
//
|
||||||
|
// You should have received a copy of the GNU General Public License
|
||||||
|
// along with this program; if not, write to the Free Software
|
||||||
|
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
||||||
|
|
||||||
|
package net.yacy.kelondro.index;
|
||||||
|
|
||||||
|
import java.io.File;
|
||||||
|
import java.io.FileOutputStream;
|
||||||
|
import java.io.IOException;
|
||||||
|
import java.util.Arrays;
|
||||||
|
import java.util.List;
|
||||||
|
|
||||||
|
import net.yacy.cora.order.ByteOrder;
|
||||||
|
import net.yacy.cora.order.NaturalOrder;
|
||||||
|
|
||||||
|
|
||||||
|
public final class BinSearch {
|
||||||
|
|
||||||
|
private final byte[] chunks;
|
||||||
|
private final int chunksize;
|
||||||
|
private final int count;
|
||||||
|
private static final ByteOrder objectOrder = new NaturalOrder(true); // the natural order is much faster than the b64Order
|
||||||
|
|
||||||
|
public BinSearch(final byte[] chunks, final int chunksize) {
|
||||||
|
this.chunks = chunks;
|
||||||
|
this.chunksize = chunksize;
|
||||||
|
this.count = chunks.length / chunksize;
|
||||||
|
}
|
||||||
|
|
||||||
|
public BinSearch(final List<byte[]> chunkList, final int chunksize) {
|
||||||
|
byte[][] chunksa = new byte[chunkList.size()][];
|
||||||
|
chunksa = chunkList.toArray(chunksa);
|
||||||
|
Arrays.sort(chunksa, objectOrder);
|
||||||
|
this.chunks = new byte[chunkList.size() * chunksize];
|
||||||
|
for (int i = 0; i < chunksa.length; i++) System.arraycopy(chunksa[i], 0, this.chunks, i * chunksize, chunksize);
|
||||||
|
this.chunksize = chunksize;
|
||||||
|
this.count = chunks.length / chunksize;
|
||||||
|
assert this.count == chunkList.size();
|
||||||
|
}
|
||||||
|
|
||||||
|
public final boolean contains(final byte[] t) {
|
||||||
|
return contains(t, 0, this.count);
|
||||||
|
}
|
||||||
|
|
||||||
|
private final boolean contains(final byte[] t, int beginPos, int endPos) {
|
||||||
|
// the endPos is exclusive, beginPos is inclusive
|
||||||
|
// this method is synchronized to make the use of the buffer possible
|
||||||
|
assert t.length == this.chunksize;
|
||||||
|
while (true) {
|
||||||
|
if (beginPos >= endPos) return false;
|
||||||
|
final int pivot = (beginPos + endPos) / 2;
|
||||||
|
if ((pivot < 0) || (pivot >= this.count)) return false;
|
||||||
|
assert this.chunksize == t.length;
|
||||||
|
final int c = objectOrder.compare(this.chunks, pivot * this.chunksize, t, 0, this.chunksize);
|
||||||
|
if (c == 0) return true;
|
||||||
|
if (c < 0) /* buffer < t */ {beginPos = pivot + 1; continue;}
|
||||||
|
if (c > 0) /* buffer > t */ {endPos = pivot; continue;}
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public final int size() {
|
||||||
|
return count;
|
||||||
|
}
|
||||||
|
|
||||||
|
public final byte[] get(final int element) {
|
||||||
|
final byte[] a = new byte[chunksize];
|
||||||
|
System.arraycopy(this.chunks, element * this.chunksize, a, 0, chunksize);
|
||||||
|
return a;
|
||||||
|
}
|
||||||
|
|
||||||
|
public final byte[] get(final int element, byte[] a) {
|
||||||
|
assert a.length == chunksize;
|
||||||
|
System.arraycopy(this.chunks, element * this.chunksize, a, 0, chunksize);
|
||||||
|
return a;
|
||||||
|
}
|
||||||
|
|
||||||
|
public final void write(File f) throws IOException {
|
||||||
|
FileOutputStream os = new FileOutputStream(f);
|
||||||
|
os.write(this.chunks);
|
||||||
|
os.flush();
|
||||||
|
os.close();
|
||||||
|
}
|
||||||
|
|
||||||
|
public static void main(final String[] args) {
|
||||||
|
final String s = "4CEvsI8FRczRBo_ApRCkwfEbFLn1pIFXg39QGMgj5RHM6HpIMJq67QX3M5iQYr_LyI_5aGDaa_bYbRgJ9XnQjpmq6QkOoGWAoEaihRqhV3kItLFHjRtqauUR";
|
||||||
|
final BinSearch bs = new BinSearch(s.getBytes(), 6);
|
||||||
|
for (int i = 0; i + 6 <= s.length(); i = i + 6) {
|
||||||
|
System.out.println(s.substring(i, i + 6) + ":" + ((bs.contains(s.substring(i, i + 6).getBytes())) ? "drin" : "draussen"));
|
||||||
|
}
|
||||||
|
for (int i = 0; i + 7 <= s.length(); i = i + 6) {
|
||||||
|
System.out.println(s.substring(i + 1, i + 7) + ":" + ((bs.contains(s.substring(i + 1, i + 7).getBytes())) ? "drin" : "draussen"));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
Loading…
Reference in new issue