fix: ensure PdfReader is closed (#8636)

This commit is contained in:
Steve Roudebush 2025-06-20 10:00:18 -05:00 committed by GitHub
commit 5d0abf424c
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -130,8 +130,7 @@ def read_docx_file(file_path: str) -> str:
 def parse_pdf_to_text(file_path: str) -> str:
     from pypdf import PdfReader
-    with Path(file_path).open("rb") as f:
-        reader = PdfReader(f)
+    with Path(file_path).open("rb") as f, PdfReader(f) as reader:
         return "\n\n".join([page.extract_text() for page in reader.pages])