Author: tilman
Date: Fri Jul 11 10:14:57 2025
New Revision: 1927131

URL: http://svn.apache.org/viewvc?rev=1927131&view=rev
Log:
PDFBOX-5660: avoid default encoding
Modified: pdfbox/branches/2.0/pdfbox/src/main/java/org/apache/pdfbox/pdfparser/PDFStreamParser.java Modified: pdfbox/branches/2.0/pdfbox/src/main/java/org/apache/pdfbox/pdfparser/PDFStreamParser.java URL: http://svn.apache.org/viewvc/pdfbox/branches/2.0/pdfbox/src/main/java/org/apache/pdfbox/pdfparser/PDFStreamParser.java?rev=1927131&r1=1927130&r2=1927131&view=diff ============================================================================== --- pdfbox/branches/2.0/pdfbox/src/main/java/org/apache/pdfbox/pdfparser/PDFStreamParser.java (original) +++ pdfbox/branches/2.0/pdfbox/src/main/java/org/apache/pdfbox/pdfparser/PDFStreamParser.java Fri Jul 11 10:14:57 2025 @@ -34,6 +34,7 @@ import org.apache.pdfbox.cos.COSNumber; import org.apache.pdfbox.cos.COSStream; import org.apache.pdfbox.io.RandomAccessBuffer; import org.apache.pdfbox.pdmodel.common.PDStream; +import org.apache.pdfbox.util.Charsets; /** * This will parse a PDF byte stream and extract operands and such. @@ -403,7 +404,7 @@ public class PDFStreamParser extends Bas { // usually, the operator here is Q, sometimes EMC (PDFBOX-2376), S (PDFBOX-3784), // or a number (PDFBOX-5957) - s = new String(binCharTestArr, startOpIdx, endOpIdx - startOpIdx); + s = new String(binCharTestArr, startOpIdx, endOpIdx - startOpIdx, Charsets.US_ASCII); if (!"Q".equals(s) && !"EMC".equals(s) && !"S".equals(s) && !s.matches("^\\d*\\.?\\d*$")) { @@ -418,7 +419,7 @@ public class PDFStreamParser extends Bas if (endOpIdx == -1) { endOpIdx = MAX_BIN_CHAR_TEST_LENGTH; - s = new String(binCharTestArr, startOpIdx, endOpIdx - startOpIdx); + s = new String(binCharTestArr, startOpIdx, endOpIdx - startOpIdx, Charsets.US_ASCII); } // look for token of 3 chars max or a number if (endOpIdx - startOpIdx > 3 && !s.matches("^\\d*\\.?\\d*$"))