package de.anomic.data; import java.io.IOException; import java.net.MalformedURLException; import java.util.HashSet; import java.util.Iterator; import java.util.Set; import net.yacy.kelondro.blob.Tables; import net.yacy.kelondro.blob.Tables.Data; import net.yacy.kelondro.data.meta.DigestURI; import net.yacy.kelondro.data.word.Word; import net.yacy.kelondro.index.RowSpaceExceededException; import net.yacy.kelondro.logging.Log; public class YMarkTables { public final static String TABLE_BOOKMARKS_BASENAME = "_bookmarks"; public final static String TABLE_BOOKMARKS_LOG = "BOOKMARKS"; public final static String TABLE_BOOKMARKS_USER_ADMIN = "admin"; public final static String TABLE_BOOKMARKS_USER_AUTHENTICATE = "AUTHENTICATE"; public final static String TABLE_BOOKMARKS_USER_AUTHENTICATE_MSG = "Authentication required!"; public final static String TABLE_BOOKMARKS_URL_PROTOCOL_HTTP = "http://"; public final static String TABLE_BOOKMARKS_URL_PROTOCOL_HTTPS = "https://"; public final static String TABLE_BOOKMARKS_COL_ID = "id"; public final static String TABLE_BOOKMARKS_COL_URL = "url"; public final static String TABLE_BOOKMARKS_COL_TITLE = "title"; public final static String TABLE_BOOKMARKS_COL_DESC = "desc"; public final static String TABLE_BOOKMARKS_COL_DATE_ADDED = "added"; public final static String TABLE_BOOKMARKS_COL_DATE_MODIFIED = "modified"; public final static String TABLE_BOOKMARKS_COL_DATE_VISITED = "visited"; public final static String TABLE_BOOKMARKS_COL_PUBLIC = "public"; public final static String TABLE_BOOKMARKS_COL_TAGS = "tags"; public final static String TABLE_BOOKMARKS_COL_VISITS = "visits"; public final static String TABLE_BOOKMARKS_COL_FOLDER = "folder"; public final static String TABLE_BOOKMARKS_COL_DEFAULT = ""; public final static String TABLE_BOOKMARKS_COL_PUBLIC_TRUE = "true"; public final static String TABLE_BOOKMARKS_COL_PUBLIC_FALSE = "false"; public final static String TABLE_BOOKMARKS_COL_VISITS_ZERO = "0"; public final static String TABLE_TAGS_BASENAME = "_tags"; public final static String TABLE_TAGS_SEPARATOR = ","; public final static String TABLE_TAGS_COL_ID = "id"; public final static String TABLE_TAGS_COL_TAG = "tag"; public final static String TABLE_TAGS_COL_URLS = "urls"; public final static int TABLE_TAGS_ACTION_ADD = 1; public final static int TABLE_TAGS_ACTION_REMOVE = 2; public final static String TABLE_FOLDERS_SEPARATOR = "/"; public final static String TABLE_FOLDERS_ROOT = "/"; public final static String TABLE_FOLDERS_UNSORTED = "/unsorted"; public final static String TABLE_FOLDERS_IMPORTED = "/imported"; private Tables worktables; public YMarkTables(final Tables wt) { this.worktables = wt; } public final static byte[] getBookmarkId(String url) throws MalformedURLException { return (new DigestURI(url, null)).hash(); } public final static byte[] getTagId(final String tag) { return Word.word2hash(tag.toLowerCase()); } public final static HashSet getTagSet(final String tagsString, boolean clean) { HashSettagSet = new HashSet(); final String[] tagArray = clean ? cleanTagsString(tagsString).split(TABLE_TAGS_SEPARATOR) : tagsString.split(TABLE_TAGS_SEPARATOR); for (final String tag : tagArray) { tagSet.add(tag); } return tagSet; } public final static HashSet getTagSet(final String tagsString) { return getTagSet(tagsString, true); } public final static HashSet getTagIdSet(final String tagsString, boolean clean) { HashSettagSet = new HashSet(); final String[] tagArray = clean ? cleanTagsString(tagsString).split(TABLE_TAGS_SEPARATOR) : tagsString.split(TABLE_TAGS_SEPARATOR); for (final String tag : tagArray) { tagSet.add(getTagId(tag)); } return tagSet; } public final static Set getTagIdSet(final String tagsString) { return getTagIdSet(tagsString, true); } public final static byte[] keySetToBytes(final HashSet urlSet) { final Iterator urlIter = urlSet.iterator(); final StringBuilder urls = new StringBuilder(); while(urlIter.hasNext()) { urls.append(TABLE_TAGS_SEPARATOR); urls.append(urlIter.next()); } urls.deleteCharAt(0); return urls.toString().getBytes(); } public final static HashSet keysStringToKeySet(final String keysString) { HashSet keySet = new HashSet(); final String[] keyArray = keysString.split(TABLE_TAGS_SEPARATOR); for (final String key : keyArray) { keySet.add(key); } return keySet; } public final static String cleanTagsString(String tagsString) { // get rid of heading, trailing and double commas since they are useless while (tagsString.length() > 0 && tagsString.charAt(0) == TABLE_TAGS_SEPARATOR.charAt(0)) { tagsString = tagsString.substring(1); } while (tagsString.endsWith(TABLE_TAGS_SEPARATOR)) { tagsString = tagsString.substring(0,tagsString.length() -1); } while (tagsString.contains(",,")){ tagsString = tagsString.replaceAll(",,", TABLE_TAGS_SEPARATOR); } // space characters following a comma are removed tagsString = tagsString.replaceAll(",\\s+", TABLE_TAGS_SEPARATOR); return tagsString; } public final static String cleanFoldersString(String foldersString) { foldersString = cleanTagsString(foldersString); // get rid of double and trailing slashes while (foldersString.endsWith("/")){ foldersString = foldersString.substring(0, foldersString.length() -1); } while (foldersString.contains("/,")){ foldersString = foldersString.replaceAll("/,", TABLE_TAGS_SEPARATOR); } while (foldersString.contains("//")){ foldersString = foldersString.replaceAll("//", "/"); } return foldersString; } /** * YMark function that updates the tag index * @param tag_table is the user specific tag index * @param tag is a single tag * @param url is the url has as returned by DigestURI.hash() * @param action is either add (1) or remove (2) * @return */ public int updateTAGTable(final String tag_table, final String tag, final byte[] url, final int action) { Tables.Row tag_row = null; final byte[] tagHash = YMarkTables.getTagId(tag); final String urlHash = new String(url); HashSeturlSet = new HashSet(); try { tag_row = this.worktables.select(tag_table, tagHash); if(tag_row == null) { switch (action) { case YMarkTables.TABLE_TAGS_ACTION_ADD: urlSet.add(urlHash); break; default: return 0; } Data tagEntry = new Data(); tagEntry.put(YMarkTables.TABLE_TAGS_COL_TAG, tag.getBytes()); tagEntry.put(YMarkTables.TABLE_TAGS_COL_URLS, YMarkTables.keySetToBytes(urlSet)); this.worktables.insert(tag_table, tagHash, tagEntry); return 1; } else { urlSet = YMarkTables.keysStringToKeySet(new String(tag_row.get(YMarkTables.TABLE_TAGS_COL_URLS))); if(urlSet.contains(urlHash)) Log.logInfo(YMarkTables.TABLE_BOOKMARKS_LOG, "ok, urlHash found!"); switch (action) { case YMarkTables.TABLE_TAGS_ACTION_ADD: urlSet.add(urlHash); break; case YMarkTables.TABLE_TAGS_ACTION_REMOVE: urlSet.remove(urlHash); if(urlSet.isEmpty()) { this.worktables.delete(tag_table, tagHash); return 1; } break; default: return 1; } tag_row.put(YMarkTables.TABLE_TAGS_COL_URLS, YMarkTables.keySetToBytes(urlSet)); this.worktables.update(tag_table, tag_row); return 1; } } catch (IOException e) { Log.logException(e); } catch (RowSpaceExceededException e) { Log.logException(e); } return 0; } }