Author: jukka
Date: Fri Oct 16 15:32:23 2009
New Revision: 825942
URL: http://svn.apache.org/viewvc?rev=825942&view=rev
Log:
TIKA-302: patch: initial support for ePUB
Add the EPUB parser to the default Tika configuration.
Modified:
lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/tika-config.xml
lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/AutoDetectParserTest.java
Modified:
lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/tika-config.xml
URL:
http://svn.apache.org/viewvc/lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/tika-config.xml?rev=825942&r1=825941&r2=825942&view=diff
==============================================================================
--- lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/tika-config.xml (original)
+++ lucene/tika/trunk/tika-core/src/main/resources/org/apache/tika/tika-config.xml Fri Oct 16 15:32:23 2009
@@ -164,6 +164,10 @@
<mime>application/mbox</mime>
</parser>
+ <parser name="parse-epub" class="org.apache.tika.parser.epub.EpubParser">
+ <mime>application/epub+zip</mime>
+ </parser>
+
</parsers>
</properties>
\ No newline at end of file
Modified:
lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/AutoDetectParserTest.java
URL:
http://svn.apache.org/viewvc/lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/AutoDetectParserTest.java?rev=825942&r1=825941&r2=825942&view=diff
==============================================================================
--- lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/AutoDetectParserTest.java (original)
+++ lucene/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/AutoDetectParserTest.java Fri Oct 16 15:32:23 2009
@@ -125,7 +125,8 @@
public void testEpub() throws Exception {
assertAutoDetect(
- "testEPUB.epub", "application/epub+zip", "");
+ "testEPUB.epub", "application/epub+zip",
+ "The previous headings were subchapters");
}
public void testExcel() throws Exception {