Author: nick
Date: Tue Jun  2 11:00:22 2015
New Revision: 1683076

URL: http://svn.apache.org/r1683076
Log:
Try to make the low-priority padded PDF magic match more specific, as it looks 
to have incorrectly triggered on a few of the govdocs text files

Modified:
    tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml

Modified: tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
URL: http://svn.apache.org/viewvc/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml?rev=1683076&r1=1683075&r2=1683076&view=diff
==============================================================================
--- tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml (original)
+++ tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml Tue Jun  2 11:00:22 2015
@@ -489,7 +489,8 @@
     <magic priority="20">
       <!-- Low priority match for %PDF near the start of the file -->
       <!-- Can trigger false positives, so set the priority rather low here -->
-      <match value="%PDF-" type="string" offset="1:512"/>
+      <match value="%PDF-1." type="string" offset="1:512"/>
+      <match value="%PDF-2." type="string" offset="1:512"/>
     </magic>
     <glob pattern="*.pdf"/>
   </mime-type>


Reply via email to