From 024f8e9b333d0b5fd95832d851e8e4003fe8224a Mon Sep 17 00:00:00 2001 From: reger Date: Tue, 13 May 2014 01:50:15 +0200 Subject: [PATCH] fix truncated urls containing "," addressing http://mantis.tokeek.de/view.php?id=58 Exclude comma from percent-encoding in MultiProtocolURL (see RFC 1738 2.2 and RFC 3986 2.2) --- source/net/yacy/cora/document/id/MultiProtocolURL.java | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/source/net/yacy/cora/document/id/MultiProtocolURL.java b/source/net/yacy/cora/document/id/MultiProtocolURL.java index b44de1e46..7435bb95c 100644 --- a/source/net/yacy/cora/document/id/MultiProtocolURL.java +++ b/source/net/yacy/cora/document/id/MultiProtocolURL.java @@ -495,8 +495,9 @@ public class MultiProtocolURL implements Serializable, ComparableThe ASCII characters 'a' through 'z', 'A' through 'Z', * and '0' through '9' remain the same. * - *
  • The unreserved characters - _ . ! ~ * ' ( ) remain the same. - * + *
  • The unreserved characters - _ . ! ~ * ' ( ) and the reserved delimiters & : ; , remain the same. + * see RFC 1738 2.2 and RFC 3986 2.2 + * *
  • All other ASCII characters are converted into the * 3-character string "%xy", where xy is * the two-digit hexadecimal representation of the character @@ -529,7 +530,8 @@ public class MultiProtocolURL implements Serializable, Comparable