yacy_search_server/source/net/yacy/kelondro/rwi/AbstractIndex.java

// AbstractIndex.java
// -----------------------------
// (C) 2009 by Michael Peter Christen; mc@yacy.net, Frankfurt a. M., Germany
// first published 15.3.2009 on http://yacy.net
//
// This is a part of YaCy, a peer-to-peer based web search engine
//
// $LastChangedDate: 2006-04-02 22:40:07 +0200 (So, 02 Apr 2006) $
// $LastChangedRevision: 1986 $
// $LastChangedBy: orbiter $
//
// LICENSE
// 
// This program is free software; you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation; either version 2 of the License, or
// (at your option) any later version.
//
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with this program; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA

package net.yacy.kelondro.rwi;

import java.io.IOException;
import java.util.HashMap;
import java.util.Iterator;
import java.util.Set;
import java.util.TreeSet;

import net.yacy.kelondro.index.RowSpaceExceededException;
import net.yacy.kelondro.logging.Log;
import net.yacy.kelondro.order.Order;

/**
 * Skeleton implementation of {@link Index}. It provides those bulk and search
 * operations that can be expressed through the primitive operations of the
 * index (single-term remove, get, has, container iteration and ordering).
 *
 * @param <ReferenceType> the kind of reference that is stored in the containers of this index
 */
public abstract class AbstractIndex <ReferenceType extends Reference> implements Index<ReferenceType> {
    
    /** factory that is handed to the container helpers (empty containers, container order, joins) */
    final protected ReferenceFactory<ReferenceType> factory;

    /**
     * @param factory the reference factory that this index uses for its containers
     */
    public AbstractIndex(final ReferenceFactory<ReferenceType> factory) {
        this.factory = factory;
    }
    
    /**
     * remove the same url hash for multiple words.
     * This is mainly used when correcting an index after a search.
     * @param termHashes the terms from which the reference shall be removed
     * @param urlHashBytes the url hash of the reference that shall be removed
     * @return the number of terms for which the single-term remove reported a removal
     * @throws IOException if one of the single-term removals fails
     */
    public int remove(final TreeSet<byte[]> termHashes, final byte[] urlHashBytes) throws IOException {
        int removed = 0;
        for (final byte[] termHash: termHashes) {
            if (remove(termHash, urlHashBytes)) removed++;
        }
        return removed;
    }
    
    /**
     * creates a set of index containers, starting the iteration at a given term hash.
     * This does not use the cache.
     * @param startHash the term hash where the container iteration starts
     * @param rot passed through to the container iterator; if true, that iterator rotates and never terminates by itself
     * @param count the maximum number of iteration steps; null or empty containers are counted as well
     * @return the collected non-empty containers, sorted by the (rotated) container order; this may contain less containers than demanded
     * @throws IOException if the container iterator cannot be created
     */
    public synchronized TreeSet<ReferenceContainer<ReferenceType>> references(final byte[] startHash, final boolean rot, int count) throws IOException {
        // the result set is ordered by a clone of the index ordering that is rotated to the start hash
        final Order<ReferenceContainer<ReferenceType>> containerOrder = new ReferenceContainerOrder<ReferenceType>(factory, this.ordering().clone());
        final ReferenceContainer<ReferenceType> emptyContainer = ReferenceContainer.emptyContainer(factory, startHash);
        containerOrder.rotate(emptyContainer);
        final TreeSet<ReferenceContainer<ReferenceType>> containers = new TreeSet<ReferenceContainer<ReferenceType>>(containerOrder);
        final Iterator<ReferenceContainer<ReferenceType>> i = references(startHash, rot);

        // this loop does not terminate using the i.hasNext() predicate when rot == true
        // because then the underlying iterator is a rotating iterator without termination.
        // In this case a termination must be ensured with a counter, and the counter
        // must be decreased in every loop. The counter is tested first, so that
        // hasNext() is not called any more once the budget is used up.
        int remaining = count;
        while (remaining > 0 && i.hasNext()) {
            final ReferenceContainer<ReferenceType> container = i.next();
            if (container != null && !container.isEmpty()) {
                containers.add(container);
            }
            remaining--; // decrease counter even if the container was null or empty to ensure termination
        }
        return containers; // this may return less containers than demanded
    }
    
    
    // methods to search in the index
    
    /**
     * collect containers for given word hashes.
     * This collection stops if a single container does not contain any references.
     * In that case only an empty result is returned.
     * A word hash whose retrieval fails with an IOException is logged and skipped;
     * it is then missing in the result map.
     * Note that the result map is keyed by byte[] objects, which are hashed and compared
     * by identity: a lookup succeeds only with the same array instances that are
     * contained in wordHashes.
     * @param wordHashes the word hashes for which containers shall be collected
     * @param urlselection passed through to the container retrieval
     * @return map of wordhash:indexContainer
     */
    public HashMap<byte[], ReferenceContainer<ReferenceType>> searchConjunction(final TreeSet<byte[]> wordHashes, final Set<String> urlselection) {
        // retrieve entities that belong to the hashes
        final HashMap<byte[], ReferenceContainer<ReferenceType>> containers = new HashMap<byte[], ReferenceContainer<ReferenceType>>(wordHashes.size());
        for (final byte[] wordHash: wordHashes) {
            // retrieve index
            final ReferenceContainer<ReferenceType> singleContainer;
            try {
                singleContainer = this.get(wordHash, urlselection);
            } catch (IOException e) {
                // best effort: a failed retrieval does not abort the whole search
                Log.logException(e);
                continue;
            }
        
            // check result: a single term without references makes the conjunction empty
            if (singleContainer == null || singleContainer.isEmpty()) {
                return new HashMap<byte[], ReferenceContainer<ReferenceType>>(0);
            }
        
            containers.put(wordHash, singleContainer);
        }
        return containers;
    }
    
    /**
     * collect containers for given word hashes and join them as they are retrieved.
     * This collection stops if a single container does not contain any references
     * or the current result of the container join results in an empty container.
     * In any fail case only an empty result container is returned; this includes the
     * case that no container could be retrieved at all (no word hashes given or every
     * retrieval failed). This method never returns null.
     * A word hash whose retrieval fails with an IOException is logged and skipped;
     * it does not take part in the join.
     * @param wordHashes the word hashes whose containers shall be joined
     * @param urlselection passed through to the container retrieval
     * @param maxDistance the maximum distance that the words in the result may have
     * @return ReferenceContainer the join result
     * @throws RowSpaceExceededException 
     */
    public ReferenceContainer<ReferenceType> searchJoin(final TreeSet<byte[]> wordHashes, final Set<String> urlselection, final int maxDistance) throws RowSpaceExceededException {
        // first check if there is any entry that has no match;
        // this uses only operations in ram
        for (final byte[] wordHash: wordHashes) {
            if (!this.has(wordHash)) return ReferenceContainer.emptyContainer(factory, null, 0);
        }
        
        // retrieve entities that belong to the hashes
        ReferenceContainer<ReferenceType> resultContainer = null;
        for (final byte[] wordHash: wordHashes) {
            // retrieve index
            final ReferenceContainer<ReferenceType> singleContainer;
            try {
                singleContainer = this.get(wordHash, urlselection);
            } catch (IOException e) {
                // best effort: a failed retrieval does not abort the whole search
                Log.logException(e);
                continue;
            }
        
            // check result
            if (singleContainer == null || singleContainer.isEmpty()) {
                return ReferenceContainer.emptyContainer(factory, null, 0);
            }
            if (resultContainer == null) {
                // the first retrieved container is the start value of the join
                resultContainer = singleContainer;
            } else {
                resultContainer = ReferenceContainer.joinConstructive(factory, resultContainer, singleContainer, maxDistance);
            }
            
            // finish if the result is empty
            if (resultContainer.isEmpty()) return resultContainer;
        }

        // nothing was retrieved (no word hashes or only failed retrievals):
        // return an empty container instead of null, as promised by the contract above
        if (resultContainer == null) return ReferenceContainer.emptyContainer(factory, null, 0);
        return resultContainer;
    }
    
    /**
     * create a term search on this index.
     * All parameters are handed over unchanged to the TermSearch constructor.
     * @param queryHashes the hashes of the terms that are searched
     * @param excludeHashes the hashes of the terms that are excluded
     * @param urlselection passed through to the term search
     * @param termFactory the reference factory for the term search
     * @param maxDistance the maximum distance that the words in the result may have
     * @return the new term search object
     * @throws RowSpaceExceededException 
     */
    public TermSearch<ReferenceType> query(
            final TreeSet<byte[]> queryHashes,
            final TreeSet<byte[]> excludeHashes,
            final Set<String> urlselection,
            final ReferenceFactory<ReferenceType> termFactory,
            final int maxDistance) throws RowSpaceExceededException {

        return new TermSearch<ReferenceType>(this, queryHashes, excludeHashes, urlselection, termFactory, maxDistance);
    }
}
refactoring to integrate indexCell data structures git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5718 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`// AbstractIndex.java`
			`// -----------------------------`
			`// (C) 2009 by Michael Peter Christen; mc@yacy.net, Frankfurt a. M., Germany`
			`// first published 15.3.2009 on http://yacy.net`
			`//`
			`// This is a part of YaCy, a peer-to-peer based web search engine`
			`//`
			`// $LastChangedDate: 2006-04-02 22:40:07 +0200 (So, 02 Apr 2006) $`
			`// $LastChangedRevision: 1986 $`
			`// $LastChangedBy: orbiter $`
			`//`
			`// LICENSE`
			`//`
			`// This program is free software; you can redistribute it and/or modify`
			`// it under the terms of the GNU General Public License as published by`
			`// the Free Software Foundation; either version 2 of the License, or`
			`// (at your option) any later version.`
			`//`
			`// This program is distributed in the hope that it will be useful,`
			`// but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`// GNU General Public License for more details.`
			`//`
			`// You should have received a copy of the GNU General Public License`
			`// along with this program; if not, write to the Free Software`
			`// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA`

accumulated classes from different packages into the new rwi package git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6394 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`package net.yacy.kelondro.rwi;`
refactoring to integrate indexCell data structures git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5718 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago
			`import java.io.IOException;`
some refactoring of search methods git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5988 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`import java.util.HashMap;`
refactoring to integrate indexCell data structures git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5718 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`import java.util.Iterator;`
			`import java.util.Set;`
more refactoring git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5722 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`import java.util.TreeSet;`

added extensive memory protection logic to avoid out of memory errors that may be caused by the RowCollection memory allocation function git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6521 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`import net.yacy.kelondro.index.RowSpaceExceededException;`
added about 450 replacements for printStackTrace() methods to pipe such traces into the log at DATA/LOG/ git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6458 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`import net.yacy.kelondro.logging.Log;`
moved kelondro order git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6392 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`import net.yacy.kelondro.order.Order;`

- full abstraction of index content type: the kelondro full text index may now also contain indexes about other content than text, i.e. navigation indexes or reverse linking indexes. - during index joins all word positions are maintained: better ranking for word distance possible; exact phrase match can be implemented soundly git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5804 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`public abstract class AbstractIndex <ReferenceType extends Reference> implements Index<ReferenceType> {`

			`final protected ReferenceFactory<ReferenceType> factory;`

			`public AbstractIndex(final ReferenceFactory<ReferenceType> factory) {`
			`this.factory = factory;`
			`}`
refactoring to integrate indexCell data structures git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5718 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago
redesign of reference hash (URL-hash) parameter hand-over: pass value as byte[], not as String. This should cause that less byte[] <-> String conversions are made during time-critical tasks. This redesign is not yet complete, more to come .. git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6775 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`public int remove(final TreeSet<byte[]> termHashes, final byte[] urlHashBytes) throws IOException {`
refactoring to integrate indexCell data structures git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5718 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`// remove the same url hashes for multiple words`
			`// this is mainly used when correcting a index after a search`
full redesign of index access data model: terms (words) are not any more retrieved by their word hash string, but by a byte[] containing the word hash. this has strong advantages when RWIs are sorted in the ReferenceContainer Cache and compared with the sun.java TreeMap method, which needed getBytes() and new String() transformations before. Many thousands of such conversions are now omitted every second, which increases the indexing speed by a factor of two. git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5812 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`final Iterator<byte[]> i = termHashes.iterator();`
refactoring to integrate indexCell data structures git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5718 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`int c = 0;`
			`while (i.hasNext()) {`
redesign of reference hash (URL-hash) parameter hand-over: pass value as byte[], not as String. This should cause that less byte[] <-> String conversions are made during time-critical tasks. This redesign is not yet complete, more to come .. git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6775 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`if (remove(i.next(), urlHashBytes)) c++;`
refactoring to integrate indexCell data structures git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5718 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`}`
			`return c;`
			`}`

full redesign of index access data model: terms (words) are not any more retrieved by their word hash string, but by a byte[] containing the word hash. this has strong advantages when RWIs are sorted in the ReferenceContainer Cache and compared with the sun.java TreeMap method, which needed getBytes() and new String() transformations before. Many thousands of such conversions are now omitted every second, which increases the indexing speed by a factor of two. git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5812 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`public synchronized TreeSet<ReferenceContainer<ReferenceType>> references(final byte[] startHash, final boolean rot, int count) throws IOException {`
more refactoring git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5722 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`// creates a set of indexContainers`
			`// this does not use the cache`
- full abstraction of index content type: the kelondro full text index may now also contain indexes about other content than text, i.e. navigation indexes or reverse linking indexes. - during index joins all word positions are maintained: better ranking for word distance possible; exact phrase match can be implemented soundly git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5804 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`final Order<ReferenceContainer<ReferenceType>> containerOrder = new ReferenceContainerOrder<ReferenceType>(factory, this.ordering().clone());`
added some modifications recommended by PMD for better performance git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6560 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`final ReferenceContainer<ReferenceType> emptyContainer = ReferenceContainer.emptyContainer(factory, startHash);`
- full abstraction of index content type: the kelondro full text index may now also contain indexes about other content than text, i.e. navigation indexes or reverse linking indexes. - during index joins all word positions are maintained: better ranking for word distance possible; exact phrase match can be implemented soundly git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5804 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`containerOrder.rotate(emptyContainer);`
			`final TreeSet<ReferenceContainer<ReferenceType>> containers = new TreeSet<ReferenceContainer<ReferenceType>>(containerOrder);`
			`final Iterator<ReferenceContainer<ReferenceType>> i = references(startHash, rot);`
more refactoring git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5722 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`//if (ram) count = Math.min(size(), count);`
- full abstraction of index content type: the kelondro full text index may now also contain indexes about other content than text, i.e. navigation indexes or reverse linking indexes. - during index joins all word positions are maintained: better ranking for word distance possible; exact phrase match can be implemented soundly git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5804 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`ReferenceContainer<ReferenceType> container;`
more refactoring git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5722 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`// this loop does not terminate using the i.hasNex() predicate when rot == true`
			`// because then the underlying iterator is a rotating iterator without termination`
			`// in this case a termination must be ensured with a counter`
			`// It must also be ensured that the counter is in/decreased every loop`
			`while ((count > 0) && (i.hasNext())) {`
			`container = i.next();`
replaced _all_ size() == 0 with isEmpty() and all size() > 0 with !isEmpty(). The isEmpty() method is much faster in some cases, especially when used to access badly balanced hashtables where an size() operation becomes a large iteration. git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6510 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`if (container != null && !container.isEmpty()) {`
more refactoring git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5722 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`containers.add(container);`
			`}`
			`count--; // decrease counter even if the container was null or empty to ensure termination`
			`}`
			`return containers; // this may return less containers as demanded`
			`}`
some refactoring of search methods git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5988 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago

			`// methods to search in the index`

			`/**`
tried a fix for the httpd access bug (too many unclosed sessions) git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6362 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`* collect containers for given word hashes.`
			`* This collection stops if a single container does not contain any references.`
some refactoring of search methods git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5988 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`* In that case only a empty result is returned.`
			`* @param wordHashes`
			`* @param urlselection`
			`* @return map of wordhash:indexContainer`
			`*/`
			`public HashMap<byte[], ReferenceContainer<ReferenceType>> searchConjunction(final TreeSet<byte[]> wordHashes, final Set<String> urlselection) {`
			`// first check if there is any entry that has no match; this uses only operations in ram`
			`/*`
			`Iterator<byte[]> i = wordHashes.iterator();`
			`while (i.hasNext()) {`
			`if (!this.has(i.next())); return new HashMap<byte[], ReferenceContainer<ReferenceType>>(0);`
			`}`
			`*/`
			`// retrieve entities that belong to the hashes`
			`final HashMap<byte[], ReferenceContainer<ReferenceType>> containers = new HashMap<byte[], ReferenceContainer<ReferenceType>>(wordHashes.size());`
			`byte[] singleHash;`
			`ReferenceContainer<ReferenceType> singleContainer;`
added some modifications recommended by PMD for better performance git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6560 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`final Iterator<byte[]> i = wordHashes.iterator();`
some refactoring of search methods git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5988 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`while (i.hasNext()) {`

			`// get next word hash:`
			`singleHash = i.next();`

			`// retrieve index`
			`try {`
			`singleContainer = this.get(singleHash, urlselection);`
			`} catch (IOException e) {`
added about 450 replacements for printStackTrace() methods to pipe such traces into the log at DATA/LOG/ git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6458 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`Log.logException(e);`
some refactoring of search methods git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5988 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`continue;`
			`}`

			`// check result`
replaced _all_ size() == 0 with isEmpty() and all size() > 0 with !isEmpty(). The isEmpty() method is much faster in some cases, especially when used to access badly balanced hashtables where an size() operation becomes a large iteration. git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6510 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`if ((singleContainer == null || singleContainer.isEmpty())) return new HashMap<byte[], ReferenceContainer<ReferenceType>>(0);`
some refactoring of search methods git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5988 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago
			`containers.put(singleHash, singleContainer);`
			`}`
			`return containers;`
			`}`

new join method for indexes (not yet used) git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6356 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`/**`
			`* collect containers for given word hashes and join them as they are retrieved.`
tried a fix for the httpd access bug (too many unclosed sessions) git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6362 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`* This collection stops if a single container does not contain any references`
			`* or the current result of the container join results in an empty container.`
new join method for indexes (not yet used) git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6356 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`* In any fail case only a empty result container is returned.`
			`* @param wordHashes`
			`* @param urlselection`
			`* @param maxDistance the maximum distance that the words in the result may have`
			`* @return ReferenceContainer the join result`
added extensive memory protection logic to avoid out of memory errors that may be caused by the RowCollection memory allocation function git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6521 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`* @throws RowSpaceExceededException`
new join method for indexes (not yet used) git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6356 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`*/`
added some modifications recommended by PMD for better performance git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6560 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`public ReferenceContainer<ReferenceType> searchJoin(final TreeSet<byte[]> wordHashes, final Set<String> urlselection, final int maxDistance) throws RowSpaceExceededException {`
tried a fix for the httpd access bug (too many unclosed sessions) git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6362 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`// first check if there is any entry that has no match;`
			`// this uses only operations in ram`
new join method for indexes (not yet used) git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6356 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`for (byte[] wordHash: wordHashes) {`
			`if (!this.has(wordHash)) return ReferenceContainer.emptyContainer(factory, null, 0);`
			`}`

			`// retrieve entities that belong to the hashes`
			`ReferenceContainer<ReferenceType> resultContainer = null;`
			`ReferenceContainer<ReferenceType> singleContainer;`
			`for (byte[] wordHash: wordHashes) {`
			`// retrieve index`
			`try {`
			`singleContainer = this.get(wordHash, urlselection);`
			`} catch (IOException e) {`
added about 450 replacements for printStackTrace() methods to pipe such traces into the log at DATA/LOG/ git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6458 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`Log.logException(e);`
new join method for indexes (not yet used) git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6356 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`continue;`
			`}`

			`// check result`
replaced _all_ size() == 0 with isEmpty() and all size() > 0 with !isEmpty(). The isEmpty() method is much faster in some cases, especially when used to access badly balanced hashtables where an size() operation becomes a large iteration. git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6510 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`if ((singleContainer == null || singleContainer.isEmpty())) return ReferenceContainer.emptyContainer(factory, null, 0);`
new join method for indexes (not yet used) git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6356 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`if (resultContainer == null) resultContainer = singleContainer; else {`
			`resultContainer = ReferenceContainer.joinConstructive(factory, resultContainer, singleContainer, maxDistance);`
			`}`

			`// finish if the result is empty`
replaced _all_ size() == 0 with isEmpty() and all size() > 0 with !isEmpty(). The isEmpty() method is much faster in some cases, especially when used to access badly balanced hashtables where an size() operation becomes a large iteration. git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6510 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`if (resultContainer.isEmpty()) return resultContainer;`
new join method for indexes (not yet used) git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6356 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`}`
			`return resultContainer;`
			`}`

- fixed problem with remote search NPE - more abstraction for search requests git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6015 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`public TermSearch<ReferenceType> query(`
more refactoring to make the segment object easier to use and to be prepared to integrate author navigation git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5992 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`final TreeSet<byte[]> queryHashes,`
			`final TreeSet<byte[]> excludeHashes,`
			`final Set<String> urlselection,`
added some modifications recommended by PMD for better performance git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6560 6c8d7289-2bf4-0310-a012-ef5d649a1542 15 years ago			`final ReferenceFactory<ReferenceType> termFactory,`
			`final int maxDistance) throws RowSpaceExceededException {`
- fixed problem with remote search NPE - more abstraction for search requests git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@6015 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago
			`return new TermSearch<ReferenceType>(this, queryHashes, excludeHashes, urlselection, termFactory, maxDistance);`
more refactoring to make the segment object easier to use and to be prepared to integrate author navigation git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5992 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`}`
refactoring to integrate indexCell data structures git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5718 6c8d7289-2bf4-0310-a012-ef5d649a1542 16 years ago			`}`