Author: mattmann
Date: Wed Nov 25 23:41:10 2009
New Revision: 884340
URL: http://svn.apache.org/viewvc?rev=884340&view=rev
Log:
- fix for TIKA-336: More issues with RDF MIME detection
Modified:
lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
lucene/tika/trunk/tika-core/src/test/resources/org/apache/tika/mime/test-difficult-rdf2.xml
Modified:
lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
URL:
http://svn.apache.org/viewvc/lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml?rev=884340&r1=884339&r2=884340&view=diff
==============================================================================
---
lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
(original)
+++
lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
Wed Nov 25 23:41:10 2009
@@ -2649,6 +2649,7 @@
<magic priority="50">
<match value="&lt;?xml" type="string" offset="0"/>
<match value="&lt;?XML" type="string" offset="0"/>
+ <match value="&lt;!--" type="string" offset="0"/>
<match value="0xFFFE3C003F0078006D006C00" type="string" offset="0"/>
<match value="0xFEFF003C003F0078006D006C" type="string" offset="0"/>
<!-- TODO: Add matches for the other possible XML encoding schemes -->
Modified:
lucene/tika/trunk/tika-core/src/test/resources/org/apache/tika/mime/test-difficult-rdf2.xml
URL:
http://svn.apache.org/viewvc/lucene/tika/trunk/tika-core/src/test/resources/org/apache/tika/mime/test-difficult-rdf2.xml?rev=884340&r1=884339&r2=884340&view=diff
==============================================================================
---
lucene/tika/trunk/tika-core/src/test/resources/org/apache/tika/mime/test-difficult-rdf2.xml
(original)
+++
lucene/tika/trunk/tika-core/src/test/resources/org/apache/tika/mime/test-difficult-rdf2.xml
Wed Nov 25 23:41:10 2009
@@ -1,5 +1,3 @@
-<?xml version='1.0' encoding='ISO-8859-1'?>
-
<!-- This is the OWL 2 Namespace Document, sometimes
called the "owl.owl" file.