mirror of
https://github.com/paperless-ngx/paperless-ngx.git
synced 2025-12-06 23:05:42 +01:00
Updated the docstring to show what's actually happening
This commit is contained in:
parent
5b479c5058
commit
10a0556951
1 changed file with 5 additions and 6 deletions
|
|
@@ -21,12 +21,11 @@ from documents.models import Document
|
||||||
class Command(BaseCommand):
|
class Command(BaseCommand):
|
||||||
"""
|
"""
|
||||||
Loop over every file found in CONSUMPTION_DIR and:
|
Loop over every file found in CONSUMPTION_DIR and:
|
||||||
1. Convert it to a greyscale tif
|
1. Convert it to a greyscale png
|
||||||
2. Convert it to a full-colour jpg
|
2. Use tesseract on the png
|
||||||
3. Use tesseract on the tif
|
3. Encrypt and store the PDF in the MEDIA_ROOT
|
||||||
4. Store the OCR'd text in the database along with the paths to the jpg
|
4. Store the OCR'd text in the database
|
||||||
and original pdf
|
5. Delete the pdf and image(s)
|
||||||
5. Delete the pdf and images
|
|
||||||
"""
|
"""
|
||||||
|
|
||||||
LOOP_TIME = 10 # Seconds
|
LOOP_TIME = 10 # Seconds
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue