# Image that adds Tesseract and the ocrd_tesserocr package on top of the
# ocrd-galley core image and runs `ocrd-tesserocr-recognize` by default.

# Tag of the core base image to build on. Declared before FROM so that it can
# be referenced in the FROM line.
ARG GIT_COMMIT="latest"
FROM quratorspk/ocrd-galley-core:$GIT_COMMIT

# pip command line used for Python package installs in this image.
ARG PIP_INSTALL="pip install --no-cache-dir"
# NOTE(review): TESSDATA_BEST_VERSION is not referenced by any instruction
# visible in this file - confirm whether it is still needed.
ARG TESSDATA_BEST_VERSION="4.0.0"
#XXX ARG OCRD_TESSEROCR_VERSION="0.16.0"

# Location of the Tesseract model data (tessdata) directory.
ENV TESSDATA_PREFIX=/usr/local/share/tessdata


# Install Tesseract and its development files from the alex-p PPA.
# Leptonica is not listed explicitly; presumably it is pulled in as a
# dependency of these packages - verify if the build relies on it.
# The apt lists are removed in the same layer so they do not end up in the image.
RUN add-apt-repository ppa:alex-p/tesseract-ocr && \
    apt-get update && \
    apt-get install -y \
      libtesseract-dev \
      tesseract-ocr && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*


# Build pip installable stuff.
# XXX use official release again:
#   "ocrd_tesserocr == ${OCRD_TESSEROCR_VERSION}"
# Until then ocrd_tesserocr is installed from the merge ref of upstream pull
# request 191. That ref is not a fixed commit, so rebuilds may pick up
# different code.
RUN ${PIP_INSTALL} \
    git+https://github.com/OCR-D/ocrd_tesserocr.git@refs/pull/191/merge


# Check pip dependencies
RUN pip check


# Default command
CMD ["ocrd-tesserocr-recognize"]