Add Japanese Vertical Support Branch for Tesseract and Ocrmypdf OCR (#2505)

* Add Japanese Vertical Support 
* Adds Japanese Vertical mappings to default configuration.
This commit is contained in:
tenpai
2024-04-16 18:24:57 +00:00
committed by GitHub
parent 36c00cc9ec
commit e731d822dc
9 changed files with 75 additions and 5 deletions

View File

@@ -77,7 +77,7 @@ RUN \
wget https://github.com/tesseract-ocr/tessdata/raw/main/khm.traineddata && \
mv khm.traineddata /usr/share/tessdata
-# Using these data files for japanese, because they work better. See #973
+# Using these data files for japanese, because they work better. Includes vertical data. See #973 and #2445.
RUN \
wget https://raw.githubusercontent.com/tesseract-ocr/tessdata_fast/master/jpn_vert.traineddata && \
wget https://raw.githubusercontent.com/tesseract-ocr/tessdata_fast/master/jpn.traineddata && \