Index: nutch-0.8/src/java/org/apache/nutch/parse/OutlinkExtractor.java
===================================================================
--- nutch-0.8/src/java/org/apache/nutch/parse/OutlinkExtractor.java	(revision 434054)
+++ nutch-0.8/src/java/org/apache/nutch/parse/OutlinkExtractor.java	(working copy)
@@ -16,13 +16,14 @@
 
 package org.apache.nutch.parse;
 
+import java.net.MalformedURLException;
 import java.util.ArrayList;
 import java.util.List;
 
 import org.apache.commons.logging.Log;
 import org.apache.commons.logging.LogFactory;
-
 import org.apache.hadoop.conf.Configuration;
+import org.apache.oro.text.regex.MalformedPatternException;
 import org.apache.oro.text.regex.MatchResult;
 import org.apache.oro.text.regex.Pattern;
 import org.apache.oro.text.regex.PatternCompiler;
@@ -108,10 +109,15 @@
         }
         result = matcher.getMatch();
         url = result.group(0);
-        outlinks.add(new Outlink(url, anchor, conf));
+        try {
+          outlinks.add(new Outlink(url, anchor, conf));
+        } catch (MalformedURLException ex) {
+          // if the Outlink cannot be created (malformed URL) we just log it and move on
+          if (LOG.isErrorEnabled()) { LOG.error("getOutlinks", ex); }
+        }
       }
-    } catch (Exception ex) {
-      // if the matcher fails (perhaps a malformed URL) we just log it and move on
+    } catch (MalformedPatternException ex) {
+      // if we cannot compile the pattern, we just log it and move on
       if (LOG.isErrorEnabled()) { LOG.error("getOutlinks", ex); }
     }
 
