Top 50 most common stack traces in tika_1_6, counted per file extension and ordered by count (descending)

FILE_EXTENSION DETECTED_FILE_EXTENSION_A SORT_STACK_TRACE_A COUNT
ppt
ppt
org.apache.tika.exception.TikaException: Unexpected RuntimeException from org.apache.tika.parser.microsoft.OfficeParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:245)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	a
452
log
xml
org.apache.tika.exception.TikaException: XML parse error
	at org.apache.tika.parser.xml.XMLParser.parse(XMLParser.java:78)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
158
doc
doc
org.apache.tika.exception.TikaException: Unexpected RuntimeException from org.apache.tika.parser.microsoft.OfficeParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:245)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	a
138
xls
xls
org.apache.tika.exception.TikaException: TIKA-198: Illegal IOException from org.apache.tika.parser.microsoft.OfficeParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:249)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
116
doc
doc
org.apache.tika.exception.TikaException: TIKA-198: Illegal IOException from org.apache.tika.parser.microsoft.OfficeParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:249)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
80
html
xml
org.apache.tika.exception.TikaException: XML parse error
	at org.apache.tika.parser.xml.XMLParser.parse(XMLParser.java:78)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
59
pdf
pdf
org.apache.tika.exception.TikaException: Unexpected RuntimeException from org.apache.tika.parser.pdf.PDFParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:245)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.ut
48
xml
xml
org.apache.tika.exception.TikaException: XML parse error
	at org.apache.tika.parser.xml.XMLParser.parse(XMLParser.java:78)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
45
xls
xls
org.apache.tika.exception.TikaException: Unexpected RuntimeException from org.apache.tika.parser.microsoft.OfficeParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:245)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	a
37
pdf
pdf
org.apache.tika.exception.TikaException: Unable to extract PDF content
	at org.apache.tika.parser.pdf.PDF2XHTML.process(PDF2XHTML.java:144)
	at org.apache.tika.parser.pdf.PDFParser.parse(PDFParser.java:158)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.c
7
pps
ppt
org.apache.tika.exception.TikaException: Unexpected RuntimeException from org.apache.tika.parser.microsoft.OfficeParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:245)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	a
5
kml
kml
org.apache.tika.exception.TikaException: XML parse error
	at org.apache.tika.parser.xml.XMLParser.parse(XMLParser.java:78)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
4
ppt
ppt
org.apache.tika.exception.TikaException: TIKA-198: Illegal IOException from org.apache.tika.parser.microsoft.OfficeParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:249)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
4
html
html
org.apache.tika.exception.TikaException: Zip bomb detected!
	at org.apache.tika.sax.SecureContentHandler.throwIfCauseOf(SecureContentHandler.java:192)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:124)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1145)
	at java.util.concurrent.ThreadPoolEx
3
pptx
pptx
org.apache.tika.exception.TikaException: Error creating OOXML extractor
	at org.apache.tika.parser.microsoft.ooxml.OOXMLExtractorFactory.parse(OOXMLExtractorFactory.java:122)
	at org.apache.tika.parser.microsoft.ooxml.OOXMLParser.parse(OOXMLParser.java:82)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	a
2
txt
txt
java.lang.OutOfMemoryError: Requested array size exceeds VM limit
	at java.util.Arrays.copyOf(Arrays.java:2367)
	at java.lang.AbstractStringBuilder.expandCapacity(AbstractStringBuilder.java:130)
	at java.lang.AbstractStringBuilder.ensureCapacityInternal(AbstractStringBuilder.java:114)
	at java.lang.AbstractStringBuilder.append(AbstractStringBuilder.java:535)
	at java.lang.StringBuffer.append(StringBuffer.java:322)
	at java.io.StringWriter.write(StringWriter.java:94)
	at org.apache.tika.sax.ToTextContentHandler.characters(ToTextContentHandler.java:92)
	at org.apache.tika.sax.ContentHandlerDecorator.characters(ContentHandlerDecorator.java:146)
	at org.apache.tika.sax.SecureContentHandler.characters(SecureContentHandler.java:270)
	at org.apache.tika.sax.ContentHandlerDecorator.characters(ContentHandlerDecorator.java:146)
	at org.apache.tika.sax.ContentHandlerDecorator.characters(ContentHandlerDecorator.java:146)
	at org.apache.tika.sax.ContentHandlerDecorator.characters(ContentHandlerDecorator.java:146)
	at org.
2
html

org.apache.tika.exception.TikaException: Unexpected RuntimeException from org.apache.tika.parser.microsoft.OfficeParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:245)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	a
1
jpg
jpg
org.apache.tika.exception.TikaException: Can't read JPEG metadata
	at org.apache.tika.parser.image.ImageMetadataExtractor.parseJpeg(ImageMetadataExtractor.java:94)
	at org.apache.tika.parser.jpeg.JpegParser.parse(JpegParser.java:56)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.E
1
jpg
jpg
org.apache.tika.exception.TikaException: Unexpected RuntimeException from org.apache.tika.parser.jpeg.JpegParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:245)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.
1
pdf
pdf
org.apache.tika.exception.TikaException: TIKA-198: Illegal IOException from org.apache.tika.parser.pdf.PDFParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:249)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.
1
rtf
rtf
org.apache.tika.exception.TikaException: Zip bomb detected!
	at org.apache.tika.sax.SecureContentHandler.throwIfCauseOf(SecureContentHandler.java:192)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:124)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1145)
	at java.util.concurrent.ThreadPoolEx
1
txt
txt
java.lang.OutOfMemoryError: Java heap space
	at java.util.Arrays.copyOf(Arrays.java:2367)
	at java.lang.AbstractStringBuilder.expandCapacity(AbstractStringBuilder.java:130)
	at java.lang.AbstractStringBuilder.ensureCapacityInternal(AbstractStringBuilder.java:114)
	at java.lang.AbstractStringBuilder.append(AbstractStringBuilder.java:535)
	at java.lang.StringBuffer.append(StringBuffer.java:322)
	at java.io.StringWriter.write(StringWriter.java:94)
	at org.apache.tika.sax.ToTextContentHandler.characters(ToTextContentHandler.java:92)
	at org.apache.tika.sax.ContentHandlerDecorator.characters(ContentHandlerDecorator.java:146)
	at org.apache.tika.sax.SecureContentHandler.characters(SecureContentHandler.java:270)
	at org.apache.tika.sax.ContentHandlerDecorator.characters(ContentHandlerDecorator.java:146)
	at org.apache.tika.sax.ContentHandlerDecorator.characters(ContentHandlerDecorator.java:146)
	at org.apache.tika.sax.ContentHandlerDecorator.characters(ContentHandlerDecorator.java:146)
	at org.apache.tika.sax.SafeCo
1
txt
txt
java.lang.OutOfMemoryError: Java heap space
	at java.util.Arrays.copyOfRange(Arrays.java:2694)
	at java.lang.String.<init>(String.java:203)
	at java.lang.String.substring(String.java:1913)
	at java.lang.String.trim(String.java:2725)
	at org.apache.tika.parser.RecursiveParserWrapper.addContent(RecursiveParserWrapper.java:246)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:146)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurre
1
xls
xls
org.apache.tika.exception.EncryptedDocumentException: Unable to process: document is encrypted
	at org.apache.tika.parser.microsoft.ExcelExtractor$TikaHSSFListener.processFile(ExcelExtractor.java:301)
	at org.apache.tika.parser.microsoft.ExcelExtractor.parse(ExcelExtractor.java:151)
	at org.apache.tika.parser.microsoft.OfficeParser.parse(OfficeParser.java:207)
	at org.apache.tika.parser.microsoft.OfficeParser.parse(OfficeParser.java:167)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceCons
1
sgml
xml
org.apache.tika.exception.TikaException: XML parse error
	at org.apache.tika.parser.xml.XMLParser.parse(XMLParser.java:78)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
1

zip
org.apache.tika.exception.TikaException: TIKA-198: Illegal IOException from org.apache.tika.parser.pkg.PackageParser
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:249)
	at org.apache.tika.parser.CompositeParser.parse(CompositeParser.java:243)
	at org.apache.tika.parser.AutoDetectParser.parse(AutoDetectParser.java:121)
	at org.apache.tika.parser.RecursiveParserWrapper.parse(RecursiveParserWrapper.java:136)
	at org.apache.tika.batch.fs.RecursiveParserWrapperFSConsumer.processFileResource(RecursiveParserWrapperFSConsumer.java:117)
	at org.apache.tika.batch.FileResourceConsumer._processFileResource(FileResourceConsumer.java:160)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:93)
	at org.apache.tika.batch.FileResourceConsumer.call(FileResourceConsumer.java:38)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471)
	at java.util.concurrent.FutureTask.run(FutureTask.java:262)
	at j
1




-- Counts rows of comparisons that have a non-null SORT_STACK_TRACE_A, one
-- result row per (FILE_EXTENSION, DETECTED_FILE_EXTENSION_A, SORT_STACK_TRACE_A)
-- combination, and keeps the 50 largest groups.
--
-- DETECTED_FILE_EXTENSION_A is listed in GROUP BY because it is selected
-- without an aggregate; leaving it out is invalid in ANSI SQL and, on engines
-- that tolerate it, reports an arbitrary detected extension for the group.
-- The trailing ORDER BY keys only break ties so the LIMIT cut is repeatable.
SELECT
    FILE_EXTENSION,
    DETECTED_FILE_EXTENSION_A,
    SORT_STACK_TRACE_A,
    COUNT(*) AS COUNT
FROM comparisons
WHERE SORT_STACK_TRACE_A IS NOT NULL
GROUP BY
    FILE_EXTENSION,
    DETECTED_FILE_EXTENSION_A,
    SORT_STACK_TRACE_A
ORDER BY
    COUNT DESC,
    DETECTED_FILE_EXTENSION_A,
    FILE_EXTENSION,
    SORT_STACK_TRACE_A
LIMIT 50;