Author: jnioche
Date: Wed Mar 9 09:04:34 2011
New Revision: 1079705
URL: http://svn.apache.org/viewvc?rev=1079705&view=rev
Log:
TIKA-611: setSortByPosition reverted to its default value (false) in
PDFTextStripper so that text in separate columns is kept separate
Modified:
tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java
Modified:
tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java
URL:
http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java?rev=1079705&r1=1079704&r2=1079705&view=diff
==============================================================================
--- tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java (original)
+++ tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java Wed Mar 9 09:04:34 2011
@@ -79,7 +79,7 @@ class PDF2XHTML extends PDFTextStripper
throws IOException {
this.handler = new XHTMLContentHandler(handler, metadata);
setForceParsing(true);
- setSortByPosition(true);
+ setSortByPosition(false);
}
@Override