Author: jukka
Date: Fri Oct 16 13:18:45 2009
New Revision: 825880

URL: http://svn.apache.org/viewvc?rev=825880&view=rev
Log:
TIKA-309: Mime type application/rdf+xml not correctly detected

Added:
    lucene/tika/trunk/tika-parsers/src/test/resources/test-documents/testRDF.rdf
Modified:
    
    lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
    lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/mime/TestMimeTypes.java
    lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/AutoDetectParserTest.java

Modified: 
lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
URL: 
http://svn.apache.org/viewvc/lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml?rev=825880&r1=825879&r2=825880&view=diff
==============================================================================
--- 
lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
 (original)
+++ 
lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
 Fri Oct 16 13:18:45 2009
@@ -355,9 +355,16 @@
   <mime-type type="application/prs.nprend"/>
   <mime-type type="application/prs.plucker"/>
   <mime-type type="application/qsig"/>
+
   <mime-type type="application/rdf+xml">
+    <acronym>RDF/XML</acronym>
+    <comment>XML syntax for RDF graphs</comment>
+    <glob pattern="*.owl"/>
     <glob pattern="*.rdf"/>
+    <root-XML localName="RDF"
+              namespaceURI="http://www.w3.org/1999/02/22-rdf-syntax-ns#"/>
   </mime-type>
+
   <mime-type type="application/reginfo+xml">
     <glob pattern="*.rif"/>
   </mime-type>

Modified: 
lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/mime/TestMimeTypes.java
URL: 
http://svn.apache.org/viewvc/lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/mime/TestMimeTypes.java?rev=825880&r1=825879&r2=825880&view=diff
==============================================================================
--- 
lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/mime/TestMimeTypes.java
 (original)
+++ 
lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/mime/TestMimeTypes.java
 Fri Oct 16 13:18:45 2009
@@ -191,6 +191,11 @@
         assertTypeByName("image/cgm", "x.CGM");
     }
 
+    public void testRdfXmlDetection() throws Exception {
+        assertTypeByName("application/rdf+xml", "x.rdf");
+        assertTypeByName("application/rdf+xml", "x.owl");
+    }
+
     public void testSvgDetection() throws Exception {
         assertType("image/svg+xml", "testSVG.svg");
         assertTypeByData("image/svg+xml", "testSVG.svg");

Modified: 
lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/AutoDetectParserTest.java
URL: 
http://svn.apache.org/viewvc/lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/AutoDetectParserTest.java?rev=825880&r1=825879&r2=825880&view=diff
==============================================================================
--- 
lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/AutoDetectParserTest.java
 (original)
+++ 
lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/AutoDetectParserTest.java
 Fri Oct 16 13:18:45 2009
@@ -114,13 +114,13 @@
         assertAutoDetect(resource, resource, type, wrongMimeType, content);
 
         assertAutoDetect(resource, null, type, type,          content);
-//        assertAutoDetect(resource, null, type, null,          content);
-//        assertAutoDetect(resource, null, type, wrongMimeType, content);
+        assertAutoDetect(resource, null, type, null,          content);
+        assertAutoDetect(resource, null, type, wrongMimeType, content);
 
-//        final String badResource = "a.xyz";
-//        assertAutoDetect(resource, badResource, type, type,          
content);
-//        assertAutoDetect(resource, badResource, type, null,          
content);
-//        assertAutoDetect(resource, badResource, type, wrongMimeType, 
content);
+        final String badResource = "a.xyz";
+        assertAutoDetect(resource, badResource, type, type,          content);
+        assertAutoDetect(resource, badResource, type, null,          content);
+        assertAutoDetect(resource, badResource, type, wrongMimeType, content);
     }
 
 
@@ -146,6 +146,10 @@
         assertAutoDetect("testPPT.ppt", POWERPOINT, "Sample Powerpoint Slide");
     }
 
+    public void testRdfXml() throws Exception {
+        assertAutoDetect("testRDF.rdf", "application/rdf+xml", "");
+    }
+
     public void testRTF() throws Exception {
         assertAutoDetect("testRTF.rtf", RTF, "indexation Word");
     }
@@ -229,7 +233,7 @@
                 + "  resourceStatedName      = " + resourceStatedName + "\n"
                 + "  realType                = " + realType + "\n"
                 + "  statedType              = " + statedType + "\n"
-                + "  expectedContentFragment = " + realType + "\n";
+                + "  expectedContentFragment = " + expectedContentFragment + "\n";
         }
     }
 }

Added: 
lucene/tika/trunk/tika-parsers/src/test/resources/test-documents/testRDF.rdf
URL: 
http://svn.apache.org/viewvc/lucene/tika/trunk/tika-parsers/src/test/resources/test-documents/testRDF.rdf?rev=825880&view=auto
==============================================================================
--- 
lucene/tika/trunk/tika-parsers/src/test/resources/test-documents/testRDF.rdf 
(added)
+++ 
lucene/tika/trunk/tika-parsers/src/test/resources/test-documents/testRDF.rdf 
Fri Oct 16 13:18:45 2009
@@ -0,0 +1,23 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements.  See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License.  You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
+         xmlns:dc="http://purl.org/dc/elements/1.1/">
+  <rdf:Description
+      rdf:about="http://lucene.apache.org/tika/"
+      dc:title="Apache Tika"/>
+</rdf:RDF>


Reply via email to