mirror of
https://github.com/paperless-ngx/paperless-ngx.git
synced 2025-12-06 06:45:05 +01:00
Fixes how a language code like chi-sim is treated in the checks
This commit is contained in:
parent
2140d42098
commit
f0497e7744
1 changed file with 10 additions and 3 deletions
|
|
@ -1,3 +1,4 @@
|
|||
import shutil
|
||||
import subprocess
|
||||
|
||||
from django.conf import settings
|
||||
|
|
@ -7,10 +8,16 @@ from django.core.checks import Warning
|
|||
|
||||
|
||||
def get_tesseract_langs(binary="tesseract"):
    """
    Return the language codes reported by ``<binary> --list-langs``.

    The first line of the command output is a header and is discarded.
    Underscores in the remaining entries are replaced with hyphens so that
    two-part languages (e.g. ``chi_sim``) come back in the expected form
    (``chi-sim``).

    :param binary: name or path of the tesseract executable; it is resolved
        with ``shutil.which``. Defaults to ``"tesseract"``.
    :return: list of language code strings. Empty when the executable cannot
        be found or when it prints nothing after the header.
    """
    executable = shutil.which(binary)
    if executable is None:
        # shutil.which() returns None for a missing executable; passing that
        # to subprocess.run() would raise TypeError, so report "no languages".
        return []

    proc = subprocess.run(
        [executable, "--list-langs"],
        capture_output=True,
    )

    # Decode bytes to string, split on any newline style (so CRLF output does
    # not leave a stray "\r" on each code), trim out the header
    proc_lines = proc.stdout.decode("utf8", errors="ignore").strip().splitlines()[1:]

    # Replace _ with - to convert two part languages to the expected code
    return [x.strip().replace("_", "-") for x in proc_lines if x.strip()]
|
||||
|
||||
|
||||
@register()
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue