diff --git src/java/org/apache/nutch/util/URLUtil.java src/java/org/apache/nutch/util/URLUtil.java
index 3fada7b..500f991 100644
--- src/java/org/apache/nutch/util/URLUtil.java
+++ src/java/org/apache/nutch/util/URLUtil.java
@@ -354,13 +354,7 @@ public class URLUtil {
   public static String toUNICODE(String url) {
     try {
       URL u = new URL(url);
-      URI p = new URI(u.getProtocol(),
-        null,
-        IDN.toUnicode(u.getHost()),
-        u.getPort(),
-        u.getPath(),
-        u.getQuery(),
-        u.getRef());
+      URI p = new URI(IDN.toUnicode(u.toString()));
 
       return p.toString();
     }
