// Schema field constants describing page structure (headlines, lists, bold/italic text,
// images, css, scripts, frames) and externally derived attributes (cms, ad servers).
// Each constant passes a SolrType, two or three boolean flags and a description string;
// the entries named *_txt / *_val in this run pass three flags, the others pass two.
// NOTE(review): several constants in this run are declared twice (boldcount_i, li_txt,
// licount_i, italiccount_i, flash_b). Duplicate enum constants do not compile; this looks
// like unresolved diff residue (old and new positions both present). Keep exactly one copy
// of each -- confirm the intended position, since constant order determines ordinals.
// NOTE(review): the description of htags_i spells "existance" (sic); it is a runtime string.
htags_i(SolrType.integer,true,true,"binary pattern for the existance of h1..h6 headlines"),
paths_txt(SolrType.text_general,true,true,true,"all path elements in the url"),
host_s(SolrType.string,true,true,"host of the url"),
canonical_s(SolrType.string,true,true,"url inside the canonical link element"),
refresh_s(SolrType.string,true,true,"link from the url property inside the refresh link element"),
metagenerator_t(SolrType.text_general,true,true,"content of <meta name=\"generator\" content=#content#> tag"),
// NOTE(review): first of two boldcount_i declarations in this run.
boldcount_i(SolrType.integer,true,true,"total number of occurrences of <b> or <strong>"),
// NOTE(review): first of two li_txt declarations in this run.
li_txt(SolrType.text_general,true,true,true,"all texts in <li> tags"),
// NOTE(review): first of two licount_i declarations in this run.
licount_i(SolrType.integer,true,true,"number of <li> tags"),
bold_txt(SolrType.text_general,true,true,true,"all texts inside of <b> or <strong> tags. no doubles. listed in the order of number of occurrences in decreasing order"),
bold_val(SolrType.integer,true,true,true,"number of occurrences of texts in bold_txt"),
// NOTE(review): first of two italiccount_i declarations in this run.
italiccount_i(SolrType.integer,true,true,"total number of occurrences of <i>"),
// NOTE(review): second boldcount_i declaration (identical arguments to the first).
boldcount_i(SolrType.integer,true,true,"total number of occurrences of <b> or <strong>"),
italic_txt(SolrType.text_general,true,true,true,"all texts inside of <i> tags. no doubles. listed in the order of number of occurrences in decreasing order"),
italic_val(SolrType.integer,true,true,true,"number of occurrences of texts in italic_txt"),
// NOTE(review): second licount_i declaration (identical arguments to the first).
licount_i(SolrType.integer,true,true,"number of <li> tags"),
// NOTE(review): second li_txt declaration (identical arguments to the first).
li_txt(SolrType.text_general,true,true,true,"all texts in <li> tags"),
imagescount_i(SolrType.integer,true,true,"number of images"),
images_tag_txt(SolrType.text_general,true,true,true," all image tags, encoded as <img> tag inclusive alt- and title property"),
images_protocol_txt(SolrType.text_general,true,true,true,"all image link protocols"),
images_urlstub_txt(SolrType.text_general,true,true,true,"all image links without the protocol and '://'"),
images_alt_txt(SolrType.text_general,true,true,true,"all image link alt tag"),
csscount_i(SolrType.integer,true,true,"number of entries in css_tag_txt and css_url_txt"),
css_tag_txt(SolrType.text_general,true,true,true,"full css tag with normalized url"),
css_url_txt(SolrType.text_general,true,true,true,"normalized urls within a css tag"),
scripts_txt(SolrType.text_general,true,true,true,"normalized urls within a scripts tag"),
scriptscount_i(SolrType.integer,true,true,"number of entries in scripts_txt"),
// NOTE(review): second italiccount_i declaration (identical arguments to the first).
italiccount_i(SolrType.integer,true,true,"total number of occurrences of <i>"),
// NOTE(review): first of two flash_b declarations in this run.
flash_b(SolrType.bool,true,true,"flag that shows if a swf file is linked"),
frames_txt(SolrType.text_general,true,true,true,"list of all links to frames"),
framesscount_i(SolrType.integer,true,true,"number of frames_txt"),
iframes_txt(SolrType.text_general,true,true,true,"list of all links to iframes"),
iframesscount_i(SolrType.integer,true,true,"number of iframes_txt"),
// NOTE(review): second flash_b declaration (identical arguments to the first).
flash_b(SolrType.bool,true,true,"flag that shows if a swf file is linked"),
responsetime_i(SolrType.integer,true,true,"response time of target server in milliseconds"),
// NOTE(review): the description below reads "listen" and "criterias" (sic); runtime string, left as is.
ext_cms_txt(SolrType.text_general,true,true,true,"names of cms attributes; if several are recognized then they are listen in decreasing order of number of matching criterias"),
ext_cms_val(SolrType.integer,true,true,true,"number of attributes that count for a specific cms in ext_cms_txt"),
ext_ads_txt(SolrType.text_general,true,true,true,"names of ad-servers/ad-services"),
@ -120,22 +140,8 @@ public enum YaCySchema implements Schema {
// Remaining schema field constants: tracker/title evaluation results, the fail reason,
// and the metadata values additionally used by URIMetadataRow.
// NOTE(review): ext_title_val is declared twice in this run (once followed by ',' and once,
// at the very end, followed by ';'), and the constant list is terminated by ';' twice
// (after applinkscount_i and after the trailing ext_title_val). This does not compile and
// looks like unresolved diff residue -- confirm which variant of the list tail is intended.
ext_tracker_txt(SolrType.text_general,true,true,true,"names of tracker server"),
ext_tracker_val(SolrType.integer,true,true,true,"number of attribute counts in ext_tracker_txt"),
ext_title_txt(SolrType.text_general,true,true,true,"names matching title expressions"),
// NOTE(review): first ext_title_val declaration (list continues after it).
ext_title_val(SolrType.integer,true,true,true,"number of matching title expressions"),
failreason_t(SolrType.text_general,true,true,"fail reason if a page was not loaded. if the page was loaded then this field is empty"),
// values used additionally by URIMetadataRow
// (the trailing comment on each entry names the accessor it corresponds to)
load_date_dt(SolrType.date,true,true,"time when resource was loaded"),
fresh_date_dt(SolrType.date,true,true,"date until resource shall be considered as fresh"),
host_id_s(SolrType.string,true,true,"id of the host, a 6-byte hash that is part of the document id"),// String hosthash();
referrer_id_txt(SolrType.string,true,true,true,"ids of referrer to this document"),// byte[] referrerHash();
md5_s(SolrType.string,true,true,"the md5 of the raw source"),// String md5();
publisher_t(SolrType.text_general,true,true,"the name of the publisher of the document"),// String dc_publisher();
// NOTE(review): language_txt passes only two boolean flags, unlike the other *_txt entries
// visible here, which pass three -- confirm this is intended.
language_txt(SolrType.string,true,true,"the language used in the document; starts with primary language"),// byte[] language();
size_i(SolrType.integer,true,true,"the size of the raw source"),// int size();
audiolinkscount_i(SolrType.integer,true,true,"number of links to audio resources"),// int laudio();
videolinkscount_i(SolrType.integer,true,true,"number of links to video resources"),// int lvideo();
// NOTE(review): the ';' below already ends the enum constant list.
applinkscount_i(SolrType.integer,true,true,"number of links to application resources");// int lapp();
// NOTE(review): second ext_title_val declaration, placed after the list was already terminated.
ext_title_val(SolrType.integer,true,true,true,"number of matching title expressions");
privateStringsolrFieldName=null;// solr field name in custom solr schema, defaults to solcell schema field name (= same as this.name() )