Merge branch 'TIKA-1508' of https://git-wip-us.apache.org/repos/asf/tika into TIKA-1508
Project: http://git-wip-us.apache.org/repos/asf/tika/repo
Commit: http://git-wip-us.apache.org/repos/asf/tika/commit/ea47b716
Tree: http://git-wip-us.apache.org/repos/asf/tika/tree/ea47b716
Diff: http://git-wip-us.apache.org/repos/asf/tika/diff/ea47b716

Branch: refs/heads/master
Commit: ea47b716e5a7a1a1637b1cef0dc439b140590711
Parents: 67941a6 a20c46c
Author: Thamme Gowda <[email protected]>
Authored: Wed Jun 1 20:14:08 2016 -0700
Committer: Thamme Gowda <[email protected]>
Committed: Wed Jun 1 20:14:08 2016 -0700

----------------------------------------------------------------------
 CHANGES.txt | 2 +
 .../org/apache/tika/mime/tika-mimetypes.xml | 9 +
 .../org/apache/tika/parser/dbf/DBFCell.java | 147 +++++++++++++
 .../apache/tika/parser/dbf/DBFColumnHeader.java | 97 +++++++++
 .../apache/tika/parser/dbf/DBFFileHeader.java | 144 +++++++++++++
 .../org/apache/tika/parser/dbf/DBFParser.java | 155 ++++++++++++++
 .../org/apache/tika/parser/dbf/DBFReader.java | 207 +++++++++++++++++++
 .../java/org/apache/tika/parser/dbf/DBFRow.java | 62 ++++++
 .../apache/tika/parser/geo/topic/GeoParser.java | 14 +-
 .../tika/parser/html/HtmlEncodingDetector.java | 16 +-
 .../org/apache/tika/parser/pdf/PDF2XHTML.java | 26 ++-
 .../services/org.apache.tika.parser.Parser | 3 +-
 .../apache/tika/parser/dbf/DBFParserTest.java | 158 ++++++++++++++
 .../apache/tika/parser/html/HtmlParserTest.java | 22 +-
 .../apache/tika/parser/pdf/PDFParserTest.java | 18 ++
 .../test/resources/test-documents/testDBF.dbf | Bin 0 -> 890 bytes
 .../test-documents/testDBF_gb18030.dbf | Bin 0 -> 144 bytes
 17 files changed, 1061 insertions(+), 19 deletions(-)
----------------------------------------------------------------------
