mirror of
https://github.com/paperless-ngx/paperless-ngx.git
synced 2025-12-08 07:45:32 +01:00
fixes #794
This commit is contained in:
parent
27cb243a2f
commit
d26c46e034
1 changed file with 2 additions and 0 deletions
|
|
@@ -119,6 +119,8 @@ class RasterisedDocumentParser(DocumentParser):
|
|||
try:
|
||||
text = extract_text(pdf_file)
|
||||
stripped = strip_excess_whitespace(text)
|
||||
stripped = stripped.replace("\0", " ")
|
||||
|
||||
self.log("debug", f"Extracted text from PDF file {pdf_file}")
|
||||
return stripped
|
||||
except PDFException:
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue