Repository: tika Updated Branches: refs/heads/2.x b3bf5141b -> 73ce7681c
TIKA-2009 -- add magic for djvu Project: http://git-wip-us.apache.org/repos/asf/tika/repo Commit: http://git-wip-us.apache.org/repos/asf/tika/commit/73ce7681 Tree: http://git-wip-us.apache.org/repos/asf/tika/tree/73ce7681 Diff: http://git-wip-us.apache.org/repos/asf/tika/diff/73ce7681 Branch: refs/heads/2.x Commit: 73ce7681c36029f91369cb533c5c78c1b96bb6dd Parents: b3bf514 Author: tballison <[email protected]> Authored: Wed Jun 15 10:11:30 2016 -0400 Committer: tballison <[email protected]> Committed: Wed Jun 15 10:11:30 2016 -0400 ---------------------------------------------------------------------- CHANGES.txt | 2 ++ .../test/java/org/apache/tika/mime/TestMimeTypes.java | 6 ++++++ .../resources/org/apache/tika/mime/tika-mimetypes.xml | 3 +++ .../src/test/resources/test-documents/testDJVU.djvu | Bin 0 -> 89 bytes 4 files changed, 11 insertions(+) ---------------------------------------------------------------------- http://git-wip-us.apache.org/repos/asf/tika/blob/73ce7681/CHANGES.txt ---------------------------------------------------------------------- diff --git a/CHANGES.txt b/CHANGES.txt index 81243fe..8984c90 100644 --- a/CHANGES.txt +++ b/CHANGES.txt @@ -10,6 +10,8 @@ Release 2.0 - Future Development Release 1.14 - ??? + * Add mime magic for DJVU files (TIKA-2009). + * Add mime definition and parser for MS Owner File (TIKA-2008). * Add mime definition for Windows Media Metafile (TIKA-2004). 
http://git-wip-us.apache.org/repos/asf/tika/blob/73ce7681/tika-app/src/test/java/org/apache/tika/mime/TestMimeTypes.java ---------------------------------------------------------------------- diff --git a/tika-app/src/test/java/org/apache/tika/mime/TestMimeTypes.java b/tika-app/src/test/java/org/apache/tika/mime/TestMimeTypes.java index d27c714..683b657 100644 --- a/tika-app/src/test/java/org/apache/tika/mime/TestMimeTypes.java +++ b/tika-app/src/test/java/org/apache/tika/mime/TestMimeTypes.java @@ -986,6 +986,12 @@ public class TestMimeTypes extends TikaTest { assertType("application/x-ms-owner", "testMSOwnerFile"); } + @Test + public void testDJVU() throws Exception { + assertType("image/vnd.djvu", "testDJVU.djvu"); + assertTypeByData("image/vnd.djvu", "testDJVU.djvu"); + } + private void assertText(byte[] prefix) throws IOException { assertMagic("text/plain", prefix); } http://git-wip-us.apache.org/repos/asf/tika/blob/73ce7681/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml ---------------------------------------------------------------------- diff --git a/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml b/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml index 9ec8d76..0f0ea86 100644 --- a/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml +++ b/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml @@ -4796,6 +4796,9 @@ <mime-type type="image/vnd.djvu"> <glob pattern="*.djvu"/> <glob pattern="*.djv"/> + <magic priority="50"> + <match value="AT&amp;TFORM" type="string" offset="0"/> + </magic> </mime-type> <mime-type type="image/vnd.dwg"> http://git-wip-us.apache.org/repos/asf/tika/blob/73ce7681/tika-test-resources/src/test/resources/test-documents/testDJVU.djvu ---------------------------------------------------------------------- diff --git a/tika-test-resources/src/test/resources/test-documents/testDJVU.djvu 
b/tika-test-resources/src/test/resources/test-documents/testDJVU.djvu new file mode 100644 index 0000000..1361d18 Binary files /dev/null and b/tika-test-resources/src/test/resources/test-documents/testDJVU.djvu differ
