import/pdf: Read text from all pages

This commit is contained in:
polyfloyd 2025-06-29 23:53:21 +02:00
parent fe53249bff
commit 5344c5b978
2 changed files with 17 additions and 29 deletions

View file

@ -22,12 +22,9 @@ set_cachier_params(
)
@cachier()
def pdf_lines(filename):
    """Return the text lines of every page of a PDF, in page order.

    Each page's extracted text is split on ``"\\n"`` and the resulting
    lines of all pages are concatenated into one flat list.

    The function is wrapped by ``@cachier()``, so results are cached by
    that decorator according to the parameters configured for it
    elsewhere in this module.

    Args:
        filename: The PDF to read; passed unchanged to ``PdfReader``.

    Returns:
        A list of strings, one per line of extracted text.
    """
    reader = PdfReader(filename)
    # A single flat comprehension over all pages; splitting on "\n" (rather
    # than splitlines()) is kept deliberately so the output is unchanged.
    return [line for page in reader.pages for line in page.extract_text().split("\n")]
@cachier()