// yacysearchitem.java
// (C) 2007 by Michael Peter Christen; mc@yacy.net, Frankfurt a. M., Germany
// first published 28.08.2007 on http://yacy.net
//
// This is a part of YaCy, a peer-to-peer based web search engine
//
// $LastChangedDate: 2006-04-02 22:40:07 +0200 (So, 02 Apr 2006) $
// $LastChangedRevision: 1986 $
// $LastChangedBy: orbiter $
//
// LICENSE
//
// This program is free software; you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation; either version 2 of the License, or
// (at your option) any later version.
//
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with this program; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
import java.io.UnsupportedEncodingException ;
import java.net.MalformedURLException ;
import java.net.URLEncoder ;
import java.util.ArrayList ;
import java.util.TreeSet ;
import de.anomic.http.httpHeader ;
import de.anomic.http.httpRequestHeader ;
import de.anomic.plasma.plasmaProfiling ;
import de.anomic.plasma.plasmaSearchEvent ;
import de.anomic.plasma.plasmaSearchRankingProcess ;
import de.anomic.plasma.plasmaSnippetCache ;
import de.anomic.plasma.plasmaSwitchboard ;
import de.anomic.search.Query ;
import de.anomic.server.serverObjects ;
import de.anomic.server.serverProfiling ;
import de.anomic.server.serverSwitch ;
import de.anomic.tools.crypt ;
import de.anomic.tools.nxTools ;
import de.anomic.tools.Formatter ;
import de.anomic.yacy.yacyNewsPool ;
import de.anomic.yacy.yacySeed ;
import de.anomic.yacy.yacyURL ;
public class yacysearchitem {
private static boolean col = true ;
private static final int namelength = 60 ;
private static final int urllength = 120 ;
public static serverObjects respond ( final httpRequestHeader header , final serverObjects post , final serverSwitch < ? > env ) {
final plasmaSwitchboard sb = ( plasmaSwitchboard ) env ;
final serverObjects prop = new serverObjects ( ) ;
final String eventID = post . get ( "eventID" , "" ) ;
final boolean authenticated = sb . adminAuthenticated ( header ) > = 2 ;
final int item = post . getInt ( "item" , - 1 ) ;
final boolean auth = ( ( String ) header . get ( httpHeader . CONNECTION_PROP_CLIENTIP , "" ) ) . equals ( "localhost" ) | | sb . verifyAuthentication ( header , true ) ;
final int display = ( post = = null ) ? 0 : post . getInt ( "display" , 0 ) ;
// default settings for blank item
prop . put ( "content" , "0" ) ;
prop . put ( "rss" , "0" ) ;
prop . put ( "references" , "0" ) ;
prop . put ( "rssreferences" , "0" ) ;
prop . put ( "dynamic" , "0" ) ;
// find search event
final plasmaSearchEvent theSearch = plasmaSearchEvent . getEvent ( eventID ) ;
if ( theSearch = = null ) {
// the event does not exist, show empty page
return prop ;
}
final Query theQuery = theSearch . getQuery ( ) ;
// dynamically update count values
final int offset = theQuery . neededResults ( ) - theQuery . displayResults ( ) + 1 ;
prop . put ( "offset" , offset ) ;
prop . put ( "itemscount" , ( item < 0 ) ? theQuery . neededResults ( ) : item + 1 ) ;
prop . put ( "totalcount" , Formatter . number ( theSearch . getRankingResult ( ) . getLocalResourceSize ( ) + theSearch . getRankingResult ( ) . getRemoteResourceSize ( ) , true ) ) ;
prop . put ( "localResourceSize" , Formatter . number ( theSearch . getRankingResult ( ) . getLocalResourceSize ( ) , true ) ) ;
prop . put ( "remoteResourceSize" , Formatter . number ( theSearch . getRankingResult ( ) . getRemoteResourceSize ( ) , true ) ) ;
prop . put ( "remoteIndexCount" , Formatter . number ( theSearch . getRankingResult ( ) . getRemoteIndexCount ( ) , true ) ) ;
prop . put ( "remotePeerCount" , Formatter . number ( theSearch . getRankingResult ( ) . getRemotePeerCount ( ) , true ) ) ;
if ( theQuery . contentdom = = Query . CONTENTDOM_TEXT ) {
// text search
// generate result object
final plasmaSearchEvent . ResultEntry result = theSearch . oneResult ( item ) ;
if ( result = = null ) return prop ; // no content
final int port = result . url ( ) . getPort ( ) ;
yacyURL faviconURL = null ;
if ( ! result . url ( ) . isLocal ( ) ) try {
faviconURL = new yacyURL ( result . url ( ) . getProtocol ( ) + "://" + result . url ( ) . getHost ( ) + ( ( port ! = - 1 ) ? ( ":" + String . valueOf ( port ) ) : "" ) + "/favicon.ico" , null ) ;
} catch ( final MalformedURLException e1 ) {
faviconURL = null ;
}
prop . put ( "content" , 1 ) ; // switch on specific content
prop . put ( "content_authorized" , authenticated ? "1" : "0" ) ;
prop . put ( "content_authorized_recommend" , ( sb . peers . newsPool . getSpecific ( yacyNewsPool . OUTGOING_DB , yacyNewsPool . CATEGORY_SURFTIPP_ADD , "url" , result . urlstring ( ) ) = = null ) ? "1" : "0" ) ;
prop . putHTML ( "content_authorized_recommend_deletelink" , "/yacysearch.html?search=" + theQuery . queryString + "&Enter=Search&count=" + theQuery . displayResults ( ) + "&offset=" + ( theQuery . neededResults ( ) - theQuery . displayResults ( ) ) + "&order=" + crypt . simpleEncode ( theQuery . ranking . toExternalString ( ) ) + "&resource=local&time=3&deleteref=" + result . hash ( ) + "&urlmaskfilter=.*" ) ;
prop . putHTML ( "content_authorized_recommend_recommendlink" , "/yacysearch.html?search=" + theQuery . queryString + "&Enter=Search&count=" + theQuery . displayResults ( ) + "&offset=" + ( theQuery . neededResults ( ) - theQuery . displayResults ( ) ) + "&order=" + crypt . simpleEncode ( theQuery . ranking . toExternalString ( ) ) + "&resource=local&time=3&recommendref=" + result . hash ( ) + "&urlmaskfilter=.*" ) ;
prop . put ( "content_authorized_urlhash" , result . hash ( ) ) ;
prop . putHTML ( "content_title" , result . title ( ) ) ;
prop . putXML ( "content_title-xml" , result . title ( ) ) ;
prop . putJSON ( "content_title-json" , result . title ( ) ) ;
prop . putHTML ( "content_link" , result . urlstring ( ) ) ;
prop . put ( "content_display" , display ) ;
prop . putHTML ( "content_faviconCode" , sb . licensedURLs . aquireLicense ( faviconURL ) ) ; // aquire license for favicon url loading
prop . put ( "content_urlhash" , result . hash ( ) ) ;
prop . put ( "content_urlhexhash" , yacySeed . b64Hash2hexHash ( result . hash ( ) ) ) ;
prop . putHTML ( "content_urlname" , nxTools . shortenURLString ( result . urlname ( ) , urllength ) ) ;
prop . put ( "content_date" , plasmaSwitchboard . dateString ( result . modified ( ) ) ) ;
prop . put ( "content_date822" , plasmaSwitchboard . dateString822 ( result . modified ( ) ) ) ;
prop . put ( "content_ybr" , plasmaSearchRankingProcess . ybr ( result . hash ( ) ) ) ;
prop . putHTML ( "content_size" , Integer . toString ( result . filesize ( ) ) ) ; // we don't use putNUM here because that number shall be usable as sorting key. To print the size, use 'sizename'
prop . putHTML ( "content_sizename" , sizename ( result . filesize ( ) ) ) ;
prop . putHTML ( "content_host" , result . url ( ) . getHost ( ) ) ;
prop . putHTML ( "content_file" , result . url ( ) . getFile ( ) ) ;
prop . putHTML ( "content_path" , result . url ( ) . getPath ( ) ) ;
prop . put ( "content_nl" , ( item = = 0 ) ? 0 : 1 ) ;
final TreeSet < String > [ ] query = theQuery . queryWords ( ) ;
yacyURL wordURL = null ;
try {
prop . putHTML ( "content_words" , URLEncoder . encode ( query [ 0 ] . toString ( ) , "UTF-8" ) ) ;
} catch ( final UnsupportedEncodingException e ) { }
prop . putHTML ( "content_former" , theQuery . queryString ) ;
prop . put ( "content_rankingprops" , result . word ( ) . toPropertyForm ( ) + ", domLengthEstimated=" + yacyURL . domLengthEstimation ( result . hash ( ) ) +
( ( yacyURL . probablyRootURL ( result . hash ( ) ) ) ? ", probablyRootURL" : "" ) +
( ( ( wordURL = yacyURL . probablyWordURL ( result . hash ( ) , query [ 0 ] ) ) ! = null ) ? ", probablyWordURL=" + wordURL . toNormalform ( false , true ) : "" ) ) ;
final plasmaSnippetCache . TextSnippet snippet = result . textSnippet ( ) ;
final String desc = ( snippet = = null ) ? "" : snippet . getLineMarked ( theQuery . fullqueryHashes ) ;
prop . put ( "content_description" , desc ) ;
prop . putXML ( "content_description-xml" , desc ) ;
prop . putJSON ( "content_description-json" , desc ) ;
serverProfiling . update ( "SEARCH" , new plasmaProfiling . searchEvent ( theQuery . id ( true ) , plasmaSearchEvent . FINALIZATION + "-" + item , 0 , 0 ) , false ) ;
return prop ;
}
if ( theQuery . contentdom = = Query . CONTENTDOM_IMAGE ) {
// image search; shows thumbnails
prop . put ( "content" , theQuery . contentdom + 1 ) ; // switch on specific content
final plasmaSnippetCache . MediaSnippet ms = theSearch . oneImage ( item ) ;
if ( ms = = null ) {
prop . put ( "content_items" , "0" ) ;
} else {
prop . putHTML ( "content_items_0_hrefCache" , ( auth ) ? "/ViewImage.png?url=" + ms . href . toNormalform ( true , false ) : ms . href . toNormalform ( true , false ) ) ;
prop . putHTML ( "content_items_0_href" , ms . href . toNormalform ( true , false ) ) ;
prop . put ( "content_items_0_code" , sb . licensedURLs . aquireLicense ( ms . href ) ) ;
prop . putHTML ( "content_items_0_name" , shorten ( ms . name , namelength ) ) ;
prop . put ( "content_items_0_attr" , ( ms . attr . equals ( "-1 x -1" ) ) ? "" : "(" + ms . attr + ")" ) ; // attributes, here: original size of image
prop . put ( "content_items_0_source" , ms . source . toNormalform ( true , false ) ) ;
prop . put ( "content_items_0_sourcedom" , ms . source . getHost ( ) ) ;
prop . put ( "content_items" , 1 ) ;
}
return prop ;
}
if ( ( theQuery . contentdom = = Query . CONTENTDOM_AUDIO ) | |
( theQuery . contentdom = = Query . CONTENTDOM_VIDEO ) | |
( theQuery . contentdom = = Query . CONTENTDOM_APP ) ) {
// any other media content
// generate result object
final plasmaSearchEvent . ResultEntry result = theSearch . oneResult ( item ) ;
if ( result = = null ) return prop ; // no content
prop . put ( "content" , theQuery . contentdom + 1 ) ; // switch on specific content
final ArrayList < plasmaSnippetCache . MediaSnippet > media = result . mediaSnippets ( ) ;
if ( item = = 0 ) col = true ;
if ( media ! = null ) {
plasmaSnippetCache . MediaSnippet ms ;
int c = 0 ;
for ( int i = 0 ; i < media . size ( ) ; i + + ) {
ms = media . get ( i ) ;
prop . putHTML ( "content_items_" + i + "_href" , ms . href . toNormalform ( true , false ) ) ;
prop . putHTML ( "content_items_" + i + "_hrefshort" , nxTools . shortenURLString ( ms . href . toNormalform ( true , false ) , urllength ) ) ;
prop . putHTML ( "content_items_" + i + "_name" , shorten ( ms . name , namelength ) ) ;
prop . put ( "content_items_" + i + "_col" , ( col ) ? "0" : "1" ) ;
c + + ;
col = ! col ;
}
prop . put ( "content_items" , c ) ;
} else {
prop . put ( "content_items" , "0" ) ;
}
return prop ;
}
return prop ;
}
private static String shorten ( final String s , final int length ) {
if ( s . length ( ) < = length ) return s ;
final int p = s . lastIndexOf ( '.' ) ;
if ( p < 0 ) return s . substring ( 0 , length - 3 ) + "..." ;
return s . substring ( 0 , length - ( s . length ( ) - p ) - 3 ) + "..." + s . substring ( p ) ;
}
private static String sizename ( int size ) {
if ( size < 1024 ) return size + " bytes" ;
size = size / 1024 ;
if ( size < 1024 ) return size + " kbyte" ;
size = size / 1024 ;
if ( size < 1024 ) return size + " mbyte" ;
size = size / 1024 ;
return size + " gbyte" ;
}
}