parent
a3d38032cb
commit
0758c868c9
@ -0,0 +1,104 @@
|
|||||||
|
/**
|
||||||
|
* HostNavigator.java
|
||||||
|
* (C) 2016 by reger24; https://github.com/reger24
|
||||||
|
*
|
||||||
|
* This is a part of YaCy, a peer-to-peer based web search engine
|
||||||
|
*
|
||||||
|
* LICENSE
|
||||||
|
*
|
||||||
|
* This program is free software; you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
* the Free Software Foundation; either version 2 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU General Public License
|
||||||
|
* along with this program.
|
||||||
|
* If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*/
|
||||||
|
package net.yacy.search.navigator;
|
||||||
|
|
||||||
|
import java.util.Collection;
|
||||||
|
import java.util.Map;
|
||||||
|
import net.yacy.cora.sorting.ReversibleScoreMap;
|
||||||
|
import net.yacy.kelondro.data.meta.URIMetadataNode;
|
||||||
|
import net.yacy.search.query.QueryModifier;
|
||||||
|
import net.yacy.search.schema.CollectionSchema;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Navigator for (internet) host names, removing www. part of url and counting
|
||||||
|
* www.host.org and host.org as same url
|
||||||
|
*/
|
||||||
|
public class HostNavigator extends StringNavigator implements Navigator {
|
||||||
|
|
||||||
|
public HostNavigator(String title, CollectionSchema field) {
|
||||||
|
super(title, field);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void incFacet(Map<String, ReversibleScoreMap<String>> facets) {
|
||||||
|
if (field != null && facets != null && !facets.isEmpty()) {
|
||||||
|
ReversibleScoreMap<String> fcts = facets.get(field.getSolrFieldName());
|
||||||
|
if (fcts != null) {
|
||||||
|
for (String host : fcts) {
|
||||||
|
int hc = fcts.get(host);
|
||||||
|
if (hc == 0) {
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
if (host.startsWith("www.")) {
|
||||||
|
host = host.substring(4);
|
||||||
|
}
|
||||||
|
this.inc(host, hc);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void incDoc(URIMetadataNode doc) {
|
||||||
|
if (field != null) {
|
||||||
|
Object val = doc.getFieldValue(field.getSolrFieldName());
|
||||||
|
if (val != null) {
|
||||||
|
if (val instanceof Collection) {
|
||||||
|
Collection<String> ll = (Collection) val;
|
||||||
|
for (String s : ll) {
|
||||||
|
if (s.startsWith("www.")) {
|
||||||
|
s = s.substring(4);
|
||||||
|
}
|
||||||
|
this.inc(s);
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
String host = (String) val;
|
||||||
|
if (host.startsWith("www.")) {
|
||||||
|
host = host.substring(4);
|
||||||
|
}
|
||||||
|
this.inc(host);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public String getQueryModifier(final String key) {
|
||||||
|
return "site:" + key;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Checks the query modifier.sitehost string
|
||||||
|
*
|
||||||
|
* @param modifier
|
||||||
|
* @param name host name
|
||||||
|
* @return true if contained in modifier.sitehost
|
||||||
|
*/
|
||||||
|
@Override
|
||||||
|
public boolean modifieractive(QueryModifier modifier, String name) {
|
||||||
|
if (modifier.sitehost != null) {
|
||||||
|
return modifier.sitehost.contains(name);
|
||||||
|
}
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
Loading…
Reference in new issue