From deadeb406eed1425d0afdf3aef794eec13e92756 Mon Sep 17 00:00:00 2001 From: orbiter Date: Sun, 1 Sep 2013 13:48:10 +0200 Subject: [PATCH] image alt tag strings should be tokenized --- defaults/solr.collection.schema | 2 +- source/net/yacy/search/schema/CollectionConfiguration.java | 2 +- source/net/yacy/search/schema/CollectionSchema.java | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/defaults/solr.collection.schema b/defaults/solr.collection.schema index b16188bb5..e531ac8b5 100644 --- a/defaults/solr.collection.schema +++ b/defaults/solr.collection.schema @@ -249,7 +249,7 @@ images_urlstub_sxt images_protocol_sxt ## all image link alt tag -images_alt_sxt +images_alt_txt ## size of images:height images_height_val diff --git a/source/net/yacy/search/schema/CollectionConfiguration.java b/source/net/yacy/search/schema/CollectionConfiguration.java index 8d5828283..dfb2cafa1 100644 --- a/source/net/yacy/search/schema/CollectionConfiguration.java +++ b/source/net/yacy/search/schema/CollectionConfiguration.java @@ -620,7 +620,7 @@ public class CollectionConfiguration extends SchemaConfiguration implements Seri if (allAttr || contains(CollectionSchema.imagescount_i)) add(doc, CollectionSchema.imagescount_i, imagesc.size()); if (allAttr || contains(CollectionSchema.images_protocol_sxt)) add(doc, CollectionSchema.images_protocol_sxt, protocolList2indexedList(imgprots)); if (allAttr || contains(CollectionSchema.images_urlstub_sxt)) add(doc, CollectionSchema.images_urlstub_sxt, imgstubs); - if (allAttr || contains(CollectionSchema.images_alt_sxt)) add(doc, CollectionSchema.images_alt_sxt, imgalts); + if (allAttr || contains(CollectionSchema.images_alt_txt)) add(doc, CollectionSchema.images_alt_txt, imgalts); if (allAttr || contains(CollectionSchema.images_height_val)) add(doc, CollectionSchema.images_height_val, imgheights); if (allAttr || contains(CollectionSchema.images_width_val)) add(doc, CollectionSchema.images_width_val, imgwidths); if (allAttr || contains(CollectionSchema.images_pixel_val)) add(doc, CollectionSchema.images_pixel_val, imgpixels); diff --git a/source/net/yacy/search/schema/CollectionSchema.java b/source/net/yacy/search/schema/CollectionSchema.java index c05342b65..70721bed4 100644 --- a/source/net/yacy/search/schema/CollectionSchema.java +++ b/source/net/yacy/search/schema/CollectionSchema.java @@ -123,7 +123,7 @@ public enum CollectionSchema implements SchemaDeclaration { images_text_t(SolrType.text_general, true, true, false, false, true, "all text/words appearing in image alt texts or the tokenized url"), images_urlstub_sxt(SolrType.string, true, true, true, false, true, "all image links without the protocol and '://'"), images_protocol_sxt(SolrType.string, true, true, true, false, false, "all image link protocols"), - images_alt_sxt(SolrType.text_general, true, true, true, false, true, "all image link alt tag"), + images_alt_txt(SolrType.text_general, true, true, true, false, true, "all image link alt tag"), images_height_val(SolrType.num_integer, true, true, true, false, false, "size of images:height"), images_width_val(SolrType.num_integer, true, true, true, false, false, "size of images:width"), images_pixel_val(SolrType.num_integer, true, true, true, false, false, "size of images as number of pixels (easier for a search restriction than with and height)"),