// Table_API_p.java // ----------------------- // (C) 2010 by Michael Peter Christen; mc@yacy.net // first published 01.02.2010 in Frankfurt, Germany on http://yacy.net // // This program is free software; you can redistribute it and/or modify // it under the terms of the GNU General Public License as published by // the Free Software Foundation; either version 2 of the License, or // (at your option) any later version. // // This program is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU General Public License for more details. // // You should have received a copy of the GNU General Public License // along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA import java.io.IOException; import java.text.DateFormat; import java.util.ArrayList; import java.util.Date; import java.util.Iterator; import java.util.List; import java.util.Map; import java.util.Map.Entry; import java.util.Set; import java.util.TreeSet; import java.util.regex.Pattern; import net.yacy.cora.document.encoding.UTF8; import net.yacy.cora.protocol.Domains; import net.yacy.cora.protocol.RequestHeader; import net.yacy.cora.util.ConcurrentLog; import net.yacy.data.WorkTables; import net.yacy.kelondro.blob.Tables; import net.yacy.kelondro.blob.Tables.Row; import net.yacy.search.Switchboard; import net.yacy.search.SwitchboardConstants; import net.yacy.search.query.QueryParams; import net.yacy.server.serverObjects; import net.yacy.server.serverSwitch; public class Table_API_p { public static serverObjects respond(@SuppressWarnings("unused") final RequestHeader header, final serverObjects post, final serverSwitch env) { final Switchboard sb = (Switchboard) env; final serverObjects prop = new serverObjects(); prop.put("showexec", 0); prop.put("showtable", 0); int startRecord = 0; int maximumRecords = 25; Pattern query = QueryParams.catchall_pattern; if (post != null && post.containsKey("startRecord")) { startRecord = post.getInt("startRecord", 0); } if (post != null && post.containsKey("maximumRecords")) { maximumRecords = post.getInt("maximumRecords", 0); } if (post != null && post.containsKey("query") && !post.get("query", "").isEmpty()) { query = Pattern.compile(".*" + post.get("query", "") + ".*"); startRecord = 0; maximumRecords = 1000; } final boolean inline = (post != null && post.getBoolean("inline")); prop.put("inline", (inline) ? 1 : 0); Pattern typefilter = QueryParams.catchall_pattern; if (post != null && post.containsKey("filter") && post.get("filter", "").length() > 0) { typefilter = Pattern.compile(post.get("filter", ".*")); } // process scheduler and event input actions boolean scheduleeventaction = false; // flag if schedule info of row changes String current_pk = ""; // pk of changed schedule data row if (post != null && post.containsKey("scheduleeventaction")) { scheduleeventaction = post.get("scheduleeventaction", "false").equalsIgnoreCase("true"); prop.put("scheduleeventaction", "false"); current_pk = post.get("current_pk", ""); } if (post != null && scheduleeventaction && !current_pk.isEmpty()) { try { Tables.Row row = sb.tables.select(WorkTables.TABLE_API_NAME, current_pk.getBytes()); if (row != null) { String action; // events if (post.containsKey("event_select_" + current_pk) && post.get("event_select_" + current_pk, "off").equals("on")) { row.put(WorkTables.TABLE_API_COL_APICALL_EVENT_KIND, "regular"); row.put(WorkTables.TABLE_API_COL_APICALL_EVENT_ACTION, "startup"); } if (post.containsKey("event_kind_" + current_pk) ) { if ("off".equals(action = post.get("event_kind_" + current_pk, "off"))) { row.put(WorkTables.TABLE_API_COL_DATE_NEXT_EXEC, ""); } row.put(WorkTables.TABLE_API_COL_APICALL_EVENT_KIND, action); } if (post.containsKey("event_action_" + current_pk) ) { row.put(WorkTables.TABLE_API_COL_APICALL_EVENT_ACTION, post.get("event_action_" + current_pk, "startup")); } // scheduler if (post.containsKey("repeat_select_" + current_pk) && post.get("repeat_select_" + current_pk, "off").equals("on")) { row.put(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_TIME, 7); row.put(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_UNIT, "days"); } if (post.containsKey("repeat_time_" + current_pk) ) { if ("off".equals(action = post.get("repeat_time_" + current_pk, "off"))) { row.put(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_TIME, 0); } else { row.put(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_TIME, Integer.parseInt(action)); } } if (post.containsKey("repeat_unit_" + current_pk) ) { action = post.get("repeat_unit_" + current_pk, "seldays"); int time = row.get(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_TIME, 1); row.put(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_UNIT, action.substring(3)); if (action.equals("selminutes") && time > 0 && time < 10) { row.put(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_TIME, 10); } if (action.equals("selminutes") && time > 50) { row.put(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_TIME, 50); } if (action.equals("selhours") && time > 23) { row.put(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_TIME, 23); } if (action.equals("seldays") && time > 30) { row.put(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_TIME, 30); } } // switch scheduler off if event kind is 'regular' final String kind = row.get(WorkTables.TABLE_API_COL_APICALL_EVENT_KIND, "off"); if ("regular".equals(kind)) row.put(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_TIME, 0); WorkTables.calculateAPIScheduler(row, false); sb.tables.update(WorkTables.TABLE_API_NAME, row); } } catch (final Throwable e) { ConcurrentLog.logException(e); } } if (post != null && !post.get("deleterows", "").isEmpty()) { for (final Map.Entry entry : post.entrySet()) { if (entry.getValue().startsWith("mark_")) { try { sb.tables.delete(WorkTables.TABLE_API_NAME, entry.getValue().substring(5).getBytes()); } catch (final IOException e) { ConcurrentLog.logException(e); } } } } if (post != null && !post.get("deleteold", "").isEmpty()) { int days = post.getInt("deleteoldtime", 365); try { Iterator ri = sb.tables.iterator(WorkTables.TABLE_API_NAME); Row row; Date now = new Date(); Date limit = new Date(now.getTime() - 1000L * 60L * 60L * 24L * days); List pkl = new ArrayList(); while (ri.hasNext()) { row = ri.next(); Date d = row.get(WorkTables.TABLE_API_COL_DATE_RECORDING, now); if (d.before(limit)) { pkl.add(row.getPK()); } } for (byte[] pk: pkl) { sb.tables.delete(WorkTables.TABLE_API_NAME, pk); } // store this call as api call; clean the call a bit before Iterator> ei = post.getSolrParams().getMap().entrySet().iterator(); Entry entry; while (ei.hasNext()) { entry = ei.next(); if (entry.getKey().startsWith("event_select")) { ei.remove(); } if (entry.getKey().startsWith("repeat_select")) { ei.remove(); } } sb.tables.recordAPICall(post, "Table_API_p.html", WorkTables.TABLE_API_TYPE_STEERING, "delete API calls older than " + days + " days"); } catch (final IOException e) { ConcurrentLog.logException(e); } } if (post != null && !post.get("execrows", "").isEmpty()) { // create a time-ordered list of events to execute final Set pks = new TreeSet(); for (final Map.Entry entry : post.entrySet()) { if (entry.getValue().startsWith("mark_")) { pks.add(entry.getValue().substring(5)); } } // now call the api URLs and store the result status final Map l = sb.tables.execAPICalls(Domains.LOCALHOST, sb.getLocalPort("port", 8090), pks, sb.getConfig(SwitchboardConstants.ADMIN_ACCOUNT_USER_NAME, "admin"), sb.getConfig(SwitchboardConstants.ADMIN_ACCOUNT_B64MD5, "")); // construct result table prop.put("showexec", l.isEmpty() ? 0 : 1); final Iterator> resultIterator = l.entrySet().iterator(); Map.Entry record; int count = 0; boolean dark = true; while (resultIterator.hasNext()) { record = resultIterator.next(); if (record == null) { continue; } prop.put("showexec_list_" + count + "_dark", ((dark) ? 1 : 0)); dark = !dark; prop.put("showexec_list_" + count + "_status", record.getValue()); prop.put("showexec_list_" + count + "_url", record.getKey()); count++; } prop.put("showexec_list", count); } // generate table prop.put("showtable", 1); prop.put("showtable_inline", inline ? 1 : 0); // insert rows final List table = new ArrayList(maximumRecords); int count = 0; int tablesize = 0; try { tablesize = sb.tables.size(WorkTables.TABLE_API_NAME); final Iterator plainIterator = sb.tables.iterator(WorkTables.TABLE_API_NAME); final Iterator mapIterator = sb.tables.orderBy(plainIterator, -1, WorkTables.TABLE_API_COL_DATE_RECORDING).iterator(); Tables.Row r; boolean dark = true; boolean scheduledactions = false; int c = 0; String type, comment, url; // first prepare a list while (mapIterator.hasNext()) { r = mapIterator.next(); if (r == null) { continue; } type = UTF8.String(r.get(WorkTables.TABLE_API_COL_TYPE)); if (!typefilter.matcher(type).matches()) { continue; } comment = UTF8.String(r.get(WorkTables.TABLE_API_COL_COMMENT)); url = UTF8.String(r.get(WorkTables.TABLE_API_COL_URL)); if (!(query.matcher(comment).matches() || query.matcher(url).matches())) { continue; } if (c >= startRecord) { table.add(r); } c++; if (table.size() >= maximumRecords) { break; } } // then work on the list for (final Tables.Row row : table) { final Date now = new Date(); final Date date = row.containsKey(WorkTables.TABLE_API_COL_DATE) ? row.get(WorkTables.TABLE_API_COL_DATE, now) : null; final Date date_recording = row.get(WorkTables.TABLE_API_COL_DATE_RECORDING, date); final Date date_last_exec = row.get(WorkTables.TABLE_API_COL_DATE_LAST_EXEC, date); final Date date_next_exec = row.get(WorkTables.TABLE_API_COL_DATE_NEXT_EXEC, (Date) null); final int callcount = row.get(WorkTables.TABLE_API_COL_APICALL_COUNT, 1); prop.put("showtable_list_" + count + "_inline", inline ? 1 : 0); prop.put("showtable_list_" + count + "_dark", dark ? 1 : 0); dark = !dark; prop.put("showtable_list_" + count + "_pk", UTF8.String(row.getPK())); prop.put("showtable_list_" + count + "_count", count); prop.put("showtable_list_" + count + "_callcount", callcount); prop.put("showtable_list_" + count + "_dateRecording", date_recording == null ? "-" : DateFormat.getDateTimeInstance().format(date_recording)); prop.put("showtable_list_" + count + "_dateLastExec", date_last_exec == null ? "-" : DateFormat.getDateTimeInstance().format(date_last_exec)); prop.put("showtable_list_" + count + "_dateNextExec", date_next_exec == null ? "-" : DateFormat.getDateTimeInstance().format(date_next_exec)); prop.put("showtable_list_" + count + "_type", row.get(WorkTables.TABLE_API_COL_TYPE)); prop.put("showtable_list_" + count + "_comment", row.get(WorkTables.TABLE_API_COL_COMMENT)); // check type & action to link crawl start URLs back to CrawlStartExpert.html if (prop.get("showtable_list_" + count + "_type", "").equals(WorkTables.TABLE_API_TYPE_CRAWLER) && prop.get("showtable_list_" + count + "_comment", "").startsWith("crawl start for")) { prop.put("showtable_list_" + count + "_isCrawlerStart", 1); final String editUrl = UTF8.String(row.get(WorkTables.TABLE_API_COL_URL)).replace("Crawler_p", "CrawlStartExpert"); prop.put("showtable_list_" + count + "_isCrawlerStart_url", editUrl); } else { prop.put("showtable_list_" + count + "_isCrawlerStart", 0); } prop.putHTML("showtable_list_" + count + "_inline_url", "http://" + sb.myPublicIP() + ":" + sb.getPublicPort("port", 8090) + UTF8.String(row.get(WorkTables.TABLE_API_COL_URL))); prop.put("showtable_list_" + count + "_scheduler_inline", inline ? "true" : "false"); prop.put("showtable_list_" + count + "_scheduler_filter", typefilter.pattern()); prop.put("showtable_list_" + count + "_scheduler_query", query.pattern()); prop.put("showtable_list_" + count + "_scheduler_startRecord", startRecord); prop.put("showtable_list_" + count + "_scheduler_maximumRecords", maximumRecords); // events final String kind = row.get(WorkTables.TABLE_API_COL_APICALL_EVENT_KIND, "off"); final String action = row.get(WorkTables.TABLE_API_COL_APICALL_EVENT_ACTION, "startup"); prop.put("showtable_list_" + count + "_event_pk", UTF8.String(row.getPK())); boolean schedulerDisabled = "regular".equals(kind); if ("off".equals(kind)) { prop.put("showtable_list_" + count + "_event", 0); } else { prop.put("showtable_list_" + count + "_event", 1); prop.put("showtable_list_" + count + "_event_selectedoff", "off".equals(kind) ? 1 : 0); prop.put("showtable_list_" + count + "_event_selectedonce", "once".equals(kind) ? 1 : 0); prop.put("showtable_list_" + count + "_event_selectedregular", "regular".equals(kind) ? 1 : 0); prop.put("showtable_list_" + count + "_event_selectedstartup", "startup".equals(action) ? 1 : 0); for (int i = 0; i < 24; i++) { String is = Integer.toString(i); if (is.length() == 1) is = "0" + is; is = is + "00"; prop.put("showtable_list_" + count + "_event_selected" + is, is.equals(action) ? 1 : 0); } } // scheduler final String unit = row.get(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_UNIT, "days"); final int time = row.get(WorkTables.TABLE_API_COL_APICALL_SCHEDULE_TIME, 0); prop.put("showtable_list_" + count + "_selectedMinutes", unit.equals("minutes") ? 1 : 0); prop.put("showtable_list_" + count + "_selectedHours", unit.equals("hours") ? 1 : 0); prop.put("showtable_list_" + count + "_selectedDays", (unit.isEmpty() || unit.equals("days")) ? 1 : 0); prop.put("showtable_list_" + count + "_scheduler_pk", UTF8.String(row.getPK())); prop.put("showtable_list_" + count + "_scheduler_disabled", schedulerDisabled ? 1 : 0); prop.put("showtable_list_" + count + "_repeatTime", time); if (time == 0) { prop.put("showtable_list_" + count + "_scheduler", 0); } else { scheduledactions = true; prop.put("showtable_list_" + count + "_scheduler", 1); prop.put("showtable_list_" + count + "_scheduler_scale_" + 0 + "_time", "off"); prop.put("showtable_list_" + count + "_scheduler_selectedMinutes", 0); prop.put("showtable_list_" + count + "_scheduler_selectedHours", 0); prop.put("showtable_list_" + count + "_scheduler_selectedDays", 0); if (unit.equals("minutes")) { for (int i = 1; i <= 5; i++) { prop.put("showtable_list_" + count + "_scheduler_scale_" + i + "_time", i * 10); prop.put("showtable_list_" + count + "_scheduler_scale_" + i + "_selected", 0); } prop.put("showtable_list_" + count + "_scheduler_scale_" + (time / 10) + "_selected", 1); prop.put("showtable_list_" + count + "_scheduler_scale", 6); prop.put("showtable_list_" + count + "_scheduler_selectedMinutes", 1); } else if (unit.equals("hours")) { for (int i = 1; i <= 23; i++) { prop.put("showtable_list_" + count + "_scheduler_scale_" + i + "_time", i); prop.put("showtable_list_" + count + "_scheduler_scale_" + i + "_selected", 0); } prop.put("showtable_list_" + count + "_scheduler_scale_" + time + "_selected", 1); prop.put("showtable_list_" + count + "_scheduler_scale", 24); prop.put("showtable_list_" + count + "_scheduler_selectedHours", 1); } else { for (int i = 1; i <= 30; i++) { prop.put("showtable_list_" + count + "_scheduler_scale_" + i + "_time", i); prop.put("showtable_list_" + count + "_scheduler_scale_" + i + "_selected", 0); } prop.put("showtable_list_" + count + "_scheduler_scale_" + time + "_selected", 1); prop.put("showtable_list_" + count + "_scheduler_scale", 31); prop.put("showtable_list_" + count + "_scheduler_selectedDays", 1); } } count++; } if (scheduledactions) { prop.put("showschedulerhint", 1); prop.put("showschedulerhint_tfminutes", sb.getConfigLong(SwitchboardConstants.CLEANUP_BUSYSLEEP, 300000) / 60000); } else { prop.put("showschedulerhint", 0); } } catch (final IOException e) { ConcurrentLog.logException(e); } prop.put("showtable_list", count); prop.put("showtable_num", count); // write navigation details prop.put("showtable_startRecord", startRecord); prop.put("showtable_maximumRecords", maximumRecords); prop.put("showtable_inline", (inline) ? 1 : 0); prop.put("showtable_filter", typefilter.pattern()); prop.put("showtable_query", query.pattern().replaceAll("\\.\\*", "")); if (tablesize >= maximumRecords) { prop.put("showtable_navigation", 1); prop.put("showtable_navigation_startRecord", startRecord); prop.put("showtable_navigation_to", Math.min(tablesize, startRecord + maximumRecords)); prop.put("showtable_navigation_of", tablesize); prop.put("showtable_navigation_left", startRecord == 0 ? 0 : 1); prop.put("showtable_navigation_left_startRecord", Math.max(0, startRecord - maximumRecords)); prop.put("showtable_navigation_left_maximumRecords", maximumRecords); prop.put("showtable_navigation_left_inline", (inline) ? 1 : 0); prop.put("showtable_navigation_left_filter", typefilter.pattern()); prop.put("showtable_navigation_left", startRecord == 0 ? 0 : 1); prop.put("showtable_navigation_filter", typefilter.pattern()); prop.put("showtable_navigation_right", startRecord + maximumRecords >= tablesize ? 0 : 1); prop.put("showtable_navigation_right_startRecord", Math.min(tablesize - maximumRecords, startRecord + maximumRecords)); prop.put("showtable_navigation_right_maximumRecords", maximumRecords); prop.put("showtable_navigation_right_inline", (inline) ? 1 : 0); prop.put("showtable_navigation_right_filter", typefilter.pattern()); } else { prop.put("showtable_navigation", 0); } // return rewrite properties return prop; } }