diff --git a/source/de/anomic/tools/DidYouMean.java b/source/de/anomic/tools/DidYouMean.java index 2b64d2c63..10f20a3dd 100644 --- a/source/de/anomic/tools/DidYouMean.java +++ b/source/de/anomic/tools/DidYouMean.java @@ -1,13 +1,12 @@ package de.anomic.tools; -import java.util.Comparator; +import java.util.Collections; import java.util.HashSet; -import java.util.Iterator; import java.util.Set; -import java.util.TreeSet; import de.anomic.kelondro.text.IndexCell; import de.anomic.kelondro.text.referencePrototype.WordReference; +import de.anomic.kelondro.util.Log; import de.anomic.plasma.parser.Word; // People make mistakes when they type words. @@ -19,79 +18,127 @@ import de.anomic.plasma.parser.Word; public class DidYouMean { - private static char[] alphabet = {'a','b','c','d','e','f','g','h','i','j','k','l','m','n','o','p', + private static final char[] alphabet = {'a','b','c','d','e','f','g','h','i','j','k','l','m','n','o','p', 'q','r','s','t','u','v','w','x','y','z','\u00e4','\u00f6','\u00fc','\u00df'}; + private static final long TIMEOUT = 2000; + private final Set set; private final IndexCell index; private String word; private int len; + private Thread ChangingOneLetter; + private Thread AddingOneLetter; + private Thread DeletingOneLetter; + private Thread ReversingTwoConsecutiveLetters; + public DidYouMean(final IndexCell index) { - this.set = new HashSet(); + // this.set = Collections.synchronizedSortedSet(new TreeSet(new wordSizeComparator())); + this.set = Collections.synchronizedSet(new HashSet()); this.word = ""; this.len = 0; this.index = index; + + this.ChangingOneLetter = new ChangingOneLetter(); + this.AddingOneLetter = new AddingOneLetter(); + this.DeletingOneLetter = new DeletingOneLetter(); + this.ReversingTwoConsecutiveLetters = new ReversingTwoConsecutiveLetters(); } public Set getSuggestion(final String word) { + long startTime = System.currentTimeMillis(); this.word = word.toLowerCase(); this.len = word.length(); + + this.ChangingOneLetter.start(); + this.AddingOneLetter.start(); + this.DeletingOneLetter.start(); + this.ReversingTwoConsecutiveLetters.start(); - ChangingOneLetter(); - AddingOneLetter(); - DeletingOneLetter(); - ReversingTwoConsecutiveLetters(); + try { + this.ChangingOneLetter.join(TIMEOUT); + this.AddingOneLetter.join(TIMEOUT); + this.DeletingOneLetter.join(TIMEOUT); + this.ReversingTwoConsecutiveLetters.join(TIMEOUT); + } catch (InterruptedException e) { + } - final Iterator it = this.set.iterator(); - final TreeSet rset = new TreeSet(new wordSizeComparator()); - String s; - while(it.hasNext()) { - s = it.next(); - if (index.has(Word.word2hash(s))) { - rset.add(s); - } - } - rset.remove(word.toLowerCase()); - return rset; + this.set.remove(word.toLowerCase()); + Log.logInfo("DidYouMean", "found "+this.set.size()+" terms; execution time: "+(System.currentTimeMillis()-startTime)+"ms"); + + return this.set; + } - private void ChangingOneLetter() { - for(int i=0; i { - + /* + private class wordSizeComparator implements Comparator { public int compare(final String o1, final String o2) { final Integer i1 = index.count(Word.word2hash(o1)); final Integer i2 = index.count(Word.word2hash(o2)); return i2.compareTo(i1); - } - + } } + */ }