Skip to content

Commit 2c5a908

Browse files
oolivfharper
authored and committed
fix: 🐛 few PDF files are considered blank - using page.get_cdrawings() to fix it
1 parent c0b0e7f commit 2c5a908

File tree

1 file changed

+7
-4
lines changed

1 file changed

+7
-4
lines changed

mindee/inputs.py

Lines changed: 7 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -62,7 +62,7 @@ def __init__(
6262
if count_pages > 3:
6363
self.merge_pdf_pages([0, count_pages - 2, count_pages - 1][:n_pdf_pages])
6464

65-
self.check_if_document_is_empty(count_pages)
65+
self.check_if_document_is_empty()
6666

6767

6868
@staticmethod
@@ -126,9 +126,8 @@ def merge_pdf_pages(self, pages_number):
126126
self.file_object = io.BytesIO(doc.write())
127127

128128

129-
def check_if_document_is_empty(self, pages_number):
129+
def check_if_document_is_empty(self):
130130
"""
131-
:param pages_number: List of pages number to use for merging in the original pdf
132131
:return: (void) Check if the document contain only empty pages
133132
"""
134133

@@ -139,6 +138,10 @@ def check_if_document_is_empty(self, pages_number):
139138
)
140139
fitz.open()
141140
for page in src:
142-
if len(page.getImageList()) > 0 or page.getText():
141+
if (
142+
len(page.get_images()) > 0
143+
or len(page.get_cdrawings()) > 0
144+
or len(page.get_text()) > 0
145+
):
143146
return
144147
raise Exception("PDF pages are empty")

0 commit comments

Comments
 (0)