We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 42b83d2, commit 3706c1e (Copy full SHA for 3706c1e)
1 file changed
mindee/input/local_input_source.py
@@ -52,9 +52,16 @@ def __init__(self) -> None:
52
self._check_mimetype()
53
if self.is_pdf():
54
self.file_object.seek(0)
55
+ # Some broken (yet fixable) PDFs can cause pdfium to crash on open.
56
if PYPDFIUM2_AVAILABLE:
- pdf = pdfium.PdfDocument(self.file_object)
57
- self.page_count = len(pdf)
+ try:
58
+ pdf = pdfium.PdfDocument(self.file_object)
59
+ self.page_count = len(pdf)
60
+ except pdfium.PdfiumError as e:
61
+ logger.warning(
62
+ "Could not open PDF file: %s due to %s", self.filename, e
63
+ )
64
+ self.page_count = 0
65
66
else:
67
self.page_count = 0
0 commit comments