diff --git a/Dockerfile b/Dockerfile index 4e020ce..697e5b2 100644 --- a/Dockerfile +++ b/Dockerfile @@ -54,6 +54,8 @@ RUN echo "deb https://notesalexp.org/tesseract-ocr/stretch/ stretch main" >> /et wget -nv https://github.com/tesseract-ocr/tessdata_best/raw/master/spa.traineddata -P /usr/share/tesseract-ocr/4.00/tessdata && \ wget -nv https://github.com/tesseract-ocr/tessdata_best/raw/master/frm.traineddata -P /usr/share/tesseract-ocr/4.00/tessdata +RUN mkdir files_for_ocr files_from_ocr + COPY ocr_pyflow /usr/local/bin COPY parse_hocr /usr/local/bin