Index: src/plugin/parse-text/src/java/org/apache/nutch/parse/text/TextParser.java
===================================================================
--- src/plugin/parse-text/src/java/org/apache/nutch/parse/text/TextParser.java	(revision 355310)
+++ src/plugin/parse-text/src/java/org/apache/nutch/parse/text/TextParser.java	(working copy)
@@ -44,10 +44,21 @@
       //        character set isn't specified in HTTP header.
       text = new String(content.getContent());    // use default encoding
     }
-
+    Outlink[] outlinks = null;
+    // check the first 40 characters for signatures of content that is not really plain text
+    String first40 = text.substring(0, Math.min(40,text.length()));
+    if (first40.indexOf("%!PS-Adobe") >= 0) {
+      // PostScript is not plain text; skip outlink extraction because
+      //    OutlinkExtractor.getOutlinks(text) can take many hours per file on PostScript
+      outlinks = new Outlink[0];
+      // also truncate the non-plain text to the 40-character prefix examined above
+      text = first40;
+    } else {
+      outlinks = OutlinkExtractor.getOutlinks(text);
+    }
     return new ParseImpl(text,
                          new ParseData(ParseStatus.STATUS_SUCCESS, "",
-                                       OutlinkExtractor.getOutlinks(text),
+                                       outlinks,
                                        metadata));
   }
 }
