Author: jukka
Date: Fri Mar 19 13:50:22 2010
New Revision: 925217
URL: http://svn.apache.org/viewvc?rev=925217&view=rev
Log:
TIKA-388: Don't trust streams that claim mark support
Modified:
lucene/tika/trunk/tika-core/src/main/java/org/apache/tika/parser/AutoDetectParser.java
Modified:
lucene/tika/trunk/tika-core/src/main/java/org/apache/tika/parser/AutoDetectParser.java
URL: http://svn.apache.org/viewvc/lucene/tika/trunk/tika-core/src/main/java/org/apache/tika/parser/AutoDetectParser.java?rev=925217&r1=925216&r2=925217&view=diff
==============================================================================
--- lucene/tika/trunk/tika-core/src/main/java/org/apache/tika/parser/AutoDetectParser.java (original)
+++ lucene/tika/trunk/tika-core/src/main/java/org/apache/tika/parser/AutoDetectParser.java Fri Mar 19 13:50:22 2010
@@ -83,10 +83,8 @@ public class AutoDetectParser extends Co
InputStream stream, ContentHandler handler,
Metadata metadata, ParseContext context)
throws IOException, SAXException, TikaException {
- // We need buffering to enable MIME magic detection before parsing
- if (!stream.markSupported()) {
- stream = new BufferedInputStream(stream);
- }
+ // We need (reliable!) mark support for type detection before parsing
+ stream = new BufferedInputStream(stream);
// Automatically detect the MIME type of the document
MediaType type = detector.detect(stream, metadata);