|
|
|
@ -170,16 +170,18 @@ public class plasmaSearchRankingProfile {
|
|
|
|
|
ranking += normalizedEntry.quality() << ((Integer) coeff.get(ENTROPY)).intValue();
|
|
|
|
|
ranking += normalizedEntry.virtualAge() << ((Integer) coeff.get(DATE)).intValue();
|
|
|
|
|
ranking += plasmaSearchPreOrder.ybr_p(normalizedEntry.urlHash()) << ((Integer) coeff.get(YBR)).intValue();
|
|
|
|
|
ranking += (normalizedEntry.posintext() == 0) ? 0 : (255 - normalizedEntry.posintext()) << ((Integer) coeff.get(POSINTEXT)).intValue();
|
|
|
|
|
ranking += (normalizedEntry.worddistance() == 0) ? 0 : (255 - normalizedEntry.worddistance()) << ((Integer) coeff.get(WORDDISTANCE)).intValue();
|
|
|
|
|
ranking += (normalizedEntry.posintext() == 0) ? 0 : (256 - normalizedEntry.posintext()) << ((Integer) coeff.get(POSINTEXT)).intValue();
|
|
|
|
|
ranking += (normalizedEntry.worddistance() == 0) ? 0 : (256 - normalizedEntry.worddistance()) << ((Integer) coeff.get(WORDDISTANCE)).intValue();
|
|
|
|
|
ranking += (normalizedEntry.hitcount() == 0) ? 0 : normalizedEntry.hitcount() << ((Integer) coeff.get(HITCOUNT)).intValue();
|
|
|
|
|
ranking += (255 - indexURL.domLengthNormalized(normalizedEntry.urlHash())) << ((Integer) coeff.get(DOMLENGTH)).intValue();
|
|
|
|
|
ranking += (256 - indexURL.domLengthNormalized(normalizedEntry.urlHash())) << ((Integer) coeff.get(DOMLENGTH)).intValue();
|
|
|
|
|
ranking += (indexURL.probablyRootURL(normalizedEntry.urlHash())) ? 16 << ((Integer) coeff.get(URLLENGTH)).intValue() : 0;
|
|
|
|
|
ranking += (indexURL.probablyWordURL(normalizedEntry.urlHash(), searchedWord)) ? 256 << ((Integer) coeff.get(QUERYINURL)).intValue() : 0;
|
|
|
|
|
/*
|
|
|
|
|
if (indexURL.probablyWordURL(normalizedEntry.urlHash(), searchedWord))
|
|
|
|
|
System.out.println("DEBUG - hash " + normalizedEntry.urlHash() + " contains word " + searchedWord + ", weighted " + ((Integer) coeff.get(QUERYINURL)).intValue() + ", ranking = " + ranking);
|
|
|
|
|
else
|
|
|
|
|
System.out.println("DEBUG - hash " + normalizedEntry.urlHash() + " contains not word " + searchedWord + ", ranking = " + ranking);
|
|
|
|
|
*/
|
|
|
|
|
return ranking;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
@ -219,11 +221,11 @@ public class plasmaSearchRankingProfile {
|
|
|
|
|
|
|
|
|
|
// prefer short urls
|
|
|
|
|
ranking += (256 - page.url().toString().length()) << ((Integer) coeff.get(URLLENGTH)).intValue();
|
|
|
|
|
ranking += (32 - urlcomps.length) << ((Integer) coeff.get(URLCOMPS)).intValue();
|
|
|
|
|
ranking += (8 * Math.max(0, 32 - urlcomps.length)) << ((Integer) coeff.get(URLCOMPS)).intValue();
|
|
|
|
|
|
|
|
|
|
// prefer long descriptions
|
|
|
|
|
ranking += (255 * page.descr().length() / 80) << ((Integer) coeff.get(DESCRLENGTH)).intValue();
|
|
|
|
|
ranking += (255 * (12 - Math.abs(12 - Math.min(12, descrcomps.length))) / 12) << ((Integer) coeff.get(DESCRCOMPS)).intValue();
|
|
|
|
|
ranking += (256 * page.descr().length() / 80) << ((Integer) coeff.get(DESCRLENGTH)).intValue();
|
|
|
|
|
ranking += (256 * (12 - Math.abs(12 - Math.min(12, descrcomps.length))) / 12) << ((Integer) coeff.get(DESCRCOMPS)).intValue();
|
|
|
|
|
|
|
|
|
|
return ranking;
|
|
|
|
|
}
|
|
|
|
|