// WebStructurePicture.java // (C) 2007 by Michael Peter Christen; mc@yacy.net, Frankfurt a. M., Germany // first published 22.05.2007 on http://yacy.net // // This is a part of YaCy, a peer-to-peer based web search engine // // $LastChangedDate$ // $LastChangedRevision$ // $LastChangedBy$ // // LICENSE // // This program is free software; you can redistribute it and/or modify // it under the terms of the GNU General Public License as published by // the Free Software Foundation; either version 2 of the License, or // (at your option) any later version. // // This program is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU General Public License for more details. // // You should have received a copy of the GNU General Public License // along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA import java.net.MalformedURLException; import java.util.ArrayList; import java.util.Date; import java.util.HashMap; import java.util.Iterator; import java.util.List; import java.util.Map; import net.yacy.cora.document.ASCII; import net.yacy.cora.protocol.RequestHeader; import net.yacy.kelondro.data.meta.DigestURI; import net.yacy.kelondro.logging.Log; import net.yacy.kelondro.order.Base64Order; import net.yacy.peers.graphics.WebStructureGraph; import net.yacy.search.Switchboard; import net.yacy.visualization.GraphPlotter; import net.yacy.visualization.PrintTool; import net.yacy.visualization.RasterPlotter; import de.anomic.server.serverObjects; import de.anomic.server.serverSwitch; public class WebStructurePicture_p { private static final double maxlongd = Long.MAX_VALUE; public static RasterPlotter respond(final RequestHeader header, final serverObjects post, final serverSwitch env) { final Switchboard sb = (Switchboard) env; String color_text = "888888"; String color_back = "FFFFFF"; String color_dot = "11BB11"; String color_line = "222222"; String color_lineend = "333333"; int width = 1024; int height = 576; int depth = 3; int nodes = 100; // maximum number of host nodes that are painted int time = -1; String host = null; int cyc = 0; if (post != null) { width = post.getInt("width", 1024); height = post.getInt("height", 576); depth = post.getInt("depth", 3); nodes = post.getInt("nodes", width * height * 100 / 1024 / 576); time = post.getInt("time", -1); host = post.get("host", null); color_text = post.get("colortext", color_text); color_back = post.get("colorback", color_back); color_dot = post.get("colordot", color_dot); color_line = post.get("colorline", color_line); color_lineend = post.get("colorlineend", color_lineend); cyc = post.getInt("cyc", 0); } // too small values lead to an error, too big to huge CPU/memory consumption, resulting in possible DOS. if (width < 32 ) width = 32; if (width > 10000) width = 10000; if (height < 24) height = 24; if (height > 10000) height = 10000; if (depth > 8) depth = 8; if (depth < 0) depth = 0; // calculate target time final long timeout = (time < 0) ? Long.MAX_VALUE : System.currentTimeMillis() + (time * 8 / 10); // find start point if ((host == null) || (host.length() == 0) || (host.equals("auto"))) { // find domain with most references host = sb.webStructure.hostWithMaxReferences(); } final RasterPlotter graphPicture; if (host == null) { // probably no information available final RasterPlotter.DrawMode drawMode = (RasterPlotter.darkColor(color_back)) ? RasterPlotter.DrawMode.MODE_ADD : RasterPlotter.DrawMode.MODE_SUB; graphPicture = new RasterPlotter(width, height, drawMode, color_back); PrintTool.print(graphPicture, width / 2, height / 2, 0, "NO WEB STRUCTURE DATA AVAILABLE.", 0); PrintTool.print(graphPicture, width / 2, height / 2 + 16, 0, "START A WEB CRAWL TO OBTAIN STRUCTURE DATA.", 0); } else { // find start hash String hash = null; if (host != null && host.length() > 0) try { hash = ASCII.String((new DigestURI("http://" + host)).hash(), 6, 6); } catch (final MalformedURLException e) {Log.logException(e);} //assert (sb.webStructure.outgoingReferences(hash) != null); // recursively find domains, up to a specific depth GraphPlotter graph = new GraphPlotter(); if (host != null && hash != null) place(graph, sb.webStructure, hash, host, nodes, timeout, 0.0, 0.0, 0, depth, cyc); //graph.print(); // apply physics to it to get a better shape if (post != null && post.containsKey("pa")) { // test with: http://localhost:8090/WebStructurePicture_p.png?pa=10&ral=0.7&raa=0.001&rar=0.0002&rel=0.25&rea=0.1&rer=0.0001 GraphPlotter.Ribbon rAll = new GraphPlotter.Ribbon(post.getFloat("ral", 0.1f), post.getFloat("raa", 0.1f), post.getFloat("rar", 0.1f)); GraphPlotter.Ribbon rEdge = new GraphPlotter.Ribbon(post.getFloat("rel", 0.05f), post.getFloat("rea", 0.1f), post.getFloat("rer", 0.1f)); for (int i = 0; i < post.getInt("pa", 1); i++) graph = graph.physics(rAll, rEdge); } // draw the graph graphPicture = graph.draw(width, height, 40, 40, 16, 16, color_back, color_dot, color_line, color_lineend, color_text); } // print headline graphPicture.setColor(color_text); PrintTool.print(graphPicture, 2, 8, 0, "YACY WEB-STRUCTURE ANALYSIS", -1); if (host != null) PrintTool.print(graphPicture, 2, 16, 0, "LINK ENVIRONMENT OF DOMAIN " + host.toUpperCase(), -1); PrintTool.print(graphPicture, width - 2, 8, 0, "SNAPSHOT FROM " + new Date().toString().toUpperCase(), 1); return graphPicture; } private static final int place( final GraphPlotter graph, final WebStructureGraph structure, final String centerhash, final String centerhost, int maxnodes, final long timeout, final double x, final double y, int nextlayer, final int maxlayer, final int cyc) { // returns the number of nodes that had been placed assert centerhost != null; final GraphPlotter.Point center = graph.getNode(centerhost); int mynodes = 0; if (center == null) { graph.addNode(centerhost, x, y, nextlayer); maxnodes--; mynodes++; } if (nextlayer == maxlayer) return mynodes; nextlayer++; final double radius = 1.0 / (1 << nextlayer); final WebStructureGraph.StructureEntry sr = structure.outgoingReferences(centerhash); final Map next = (sr == null) ? new HashMap() : sr.references; Map.Entry entry; String targethash, targethost; // first set points to next hosts final Iterator> i = next.entrySet().iterator(); final List targets = new ArrayList(); int maxtargetrefs = 8, maxthisrefs = 8; int targetrefs, thisrefs; double rr, re; while (i.hasNext() && maxnodes > 0 && System.currentTimeMillis() < timeout) { entry = i.next(); targethash = entry.getKey(); targethost = structure.hostHash2hostName(targethash); if (targethost == null) continue; thisrefs = entry.getValue().intValue(); targetrefs = structure.referencesCount(targethash); // can be cpu/time-critical maxtargetrefs = Math.max(targetrefs, maxtargetrefs); maxthisrefs = Math.max(thisrefs, maxthisrefs); targets.add(new String[] {targethash, targethost}); if (graph.getNode(targethost) != null) continue; // set a new point. It is placed on a circle around the host point final double angle = ((Base64Order.enhancedCoder.cardinal((targethash + "____").getBytes()) / maxlongd) + (cyc / 360.0d)) * 2.0d * Math.PI; //System.out.println("ANGLE = " + angle); rr = radius * 0.25 * (1 - targetrefs / (double) maxtargetrefs); re = radius * 0.5 * (thisrefs / (double) maxthisrefs); graph.addNode(targethost, x + (radius - rr - re) * Math.cos(angle), y + (radius - rr - re) * Math.sin(angle), nextlayer); maxnodes--; mynodes++; } // recursively set next hosts final Iterator j = targets.iterator(); String[] target; int nextnodes; while (j.hasNext()) { target = j.next(); targethash = target[0]; targethost = target[1]; final GraphPlotter.Point c = graph.getNode(targethost); assert c != null; nextnodes = ((maxnodes <= 0) || (System.currentTimeMillis() >= timeout)) ? 0 : place(graph, structure, targethash, targethost, maxnodes, timeout, c.x, c.y, nextlayer, maxlayer, cyc); mynodes += nextnodes; maxnodes -= nextnodes; graph.setEdge(centerhost, targethost); } return mynodes; } }