import/pdf: Read text from all pages
This commit is contained in:
parent
fe53249bff
commit
5344c5b978
2 changed files with 17 additions and 29 deletions
|
@ -22,12 +22,9 @@ set_cachier_params(
|
|||
)
|
||||
|
||||
|
||||
@cachier()
|
||||
def pdf_lines(filename):
|
||||
reader = PdfReader(filename)
|
||||
return list(
|
||||
line for page in reader.pages for line in page.extract_text().split("\n")
|
||||
)
|
||||
return [line for page in reader.pages for line in page.extract_text().split("\n")]
|
||||
|
||||
|
||||
@cachier()
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue