mirror of
https://github.com/TheAnachronism/docspell.git
synced 2025-06-21 18:08:25 +00:00
temporary download khmer traineddata before the package being added to registry
This commit is contained in:
@ -33,7 +33,6 @@ RUN apk update && \
|
||||
tesseract-ocr-data-pol \
|
||||
tesseract-ocr-data-est \
|
||||
tesseract-ocr-data-ukr \
|
||||
tesseract-ocr-data-khm \
|
||||
unpaper \
|
||||
weasyprint \
|
||||
libreoffice \
|
||||
@ -70,6 +69,12 @@ RUN wget ${joex_url:-https://github.com/eikek/docspell/releases/download/v$versi
|
||||
ln -snf docspell-joex-* docspell-joex && \
|
||||
rm docspell-joex/conf/docspell-joex.conf
|
||||
|
||||
# temporary download traineddata directly for khmer lang
|
||||
# before tesseract-ocr-data-khm being added to the registry
|
||||
RUN \
|
||||
wget https://github.com/tesseract-ocr/tessdata/raw/main/khm.traineddata && \
|
||||
mv khm.traineddata /usr/share/tessdata
|
||||
|
||||
# Using these data files for japanese, because they work better. See #973
|
||||
RUN \
|
||||
wget https://raw.githubusercontent.com/tesseract-ocr/tessdata_fast/master/jpn_vert.traineddata && \
|
||||
|
Reference in New Issue
Block a user