Author: tilman
Date: Tue Jan 13 11:46:49 2026
New Revision: 1931289

Log:
PDFBOX-6145: move the hasContents() check from the page loop into processPage(),
after the page number check, so that only pages passing that check have their
contents checked

Modified:
   pdfbox/trunk/pdfbox/src/main/java/org/apache/pdfbox/text/PDFTextStripper.java

Modified: 
pdfbox/trunk/pdfbox/src/main/java/org/apache/pdfbox/text/PDFTextStripper.java
==============================================================================
--- pdfbox/trunk/pdfbox/src/main/java/org/apache/pdfbox/text/PDFTextStripper.java	Tue Jan 13 11:46:45 2026	(r1931288)
+++ pdfbox/trunk/pdfbox/src/main/java/org/apache/pdfbox/text/PDFTextStripper.java	Tue Jan 13 11:46:49 2026	(r1931289)
@@ -298,10 +298,7 @@ public class PDFTextStripper extends Leg
 
         for (PDPage page : pages)
         {
-            if (page.hasContents())
-            {
-                processPage(page);
-            }
+            processPage(page);
             currentPageNo++;
         }
     }
@@ -343,6 +340,10 @@ public class PDFTextStripper extends Leg
                 && (startBookmarkPageNumber == -1 || currentPageNo >= startBookmarkPageNumber)
                 && (endBookmarkPageNumber == -1 || currentPageNo <= endBookmarkPageNumber))
         {
+            if (!page.hasContents())
+            {
+                return;
+            }
             startPage(page);
 
             int numberOfArticleSections = 1;

Reply via email to