mirror of
https://gitlab.ub.uni-bielefeld.de/sfb1288inf/ocr.git
synced 2024-12-27 10:44:17 +00:00
Add back german language models
This commit is contained in:
parent
947658a7d8
commit
6db7f70446
@ -68,7 +68,7 @@ RUN wget --no-check-certificate --quiet \
|
|||||||
&& cd - > /dev/null \
|
&& cd - > /dev/null \
|
||||||
&& rm -r "tesseract-${TESSERACT_VERSION}" "${TESSERACT_VERSION}.tar.gz"
|
&& rm -r "tesseract-${TESSERACT_VERSION}" "${TESSERACT_VERSION}.tar.gz"
|
||||||
|
|
||||||
ENV TESSERACT_MODELS="ara,chi_tra,dan,ell,eng,enm,fra,frk,frm,ita,por,rus,spa"
|
ENV TESSERACT_MODELS="ara,chi_tra,dan,deu,ell,eng,enm,fra,frk,frm,ita,por,rus,spa"
|
||||||
ENV TESSDATA_BEST_VERSION=4.1.0
|
ENV TESSDATA_BEST_VERSION=4.1.0
|
||||||
RUN wget --no-check-certificate --quiet \
|
RUN wget --no-check-certificate --quiet \
|
||||||
"https://github.com/tesseract-ocr/tessdata_best/archive/${TESSDATA_BEST_VERSION}.tar.gz" \
|
"https://github.com/tesseract-ocr/tessdata_best/archive/${TESSDATA_BEST_VERSION}.tar.gz" \
|
||||||
|
2
ocr
2
ocr
@ -322,7 +322,7 @@ def parse_args():
|
|||||||
type=int)
|
type=int)
|
||||||
parser.add_argument('--n-cores',
|
parser.add_argument('--n-cores',
|
||||||
default=min(4, multiprocessing.cpu_count()),
|
default=min(4, multiprocessing.cpu_count()),
|
||||||
help='Number of CPU threads to be used', # noqa
|
help='Number of CPU threads to be used',
|
||||||
type=int)
|
type=int)
|
||||||
parser.add_argument('--zip',
|
parser.add_argument('--zip',
|
||||||
help='Create one zip file per filetype')
|
help='Create one zip file per filetype')
|
||||||
|
Loading…
Reference in New Issue
Block a user