Skip to content

Commit 5d3b0cd

Browse files
committed
fix error handling when opening corrupted PDFs
1 parent 95646fb commit 5d3b0cd

File tree

1 file changed

+6
-2
lines changed

1 file changed

+6
-2
lines changed

RAGManager/app/services/pdf_processor.py

Lines changed: 6 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -116,8 +116,12 @@ def pdf_to_document(
116 116       try:
117 117           pdf = pdfplumber.open(io.BytesIO(pdf_bytes))
118 118       except Exception as e:
119     -         logger.error(f"Failed to open PDF '{object_name}': {e} (possibly corrupted or password-protected)")
120     -         return documents
    119 +         logger.error(
    120 +             "Failed to open PDF '%s': %s (possibly corrupted or password-protected)",
    121 +             object_name,
    122 +             e,
    123 +         )
    124 +         raise ValueError(f"Failed to open PDF '{object_name}': {e}") from e
121 125
122 126       try:
123 127           for page_num, page in enumerate(pdf.pages, start=1):

0 commit comments

Comments (0)