diff --git a/Dockerfile-ocrd_tesserocr b/Dockerfile-ocrd_tesserocr
index 30a6609..b9aca74 100644
--- a/Dockerfile-ocrd_tesserocr
+++ b/Dockerfile-ocrd_tesserocr
@@ -24,7 +24,7 @@ COPY data/tesseract-models/GT4HistOCR/GT4HistOCR_2000000.traineddata $TESSDATA_P
 # Build pip installable stuff
 RUN ${PIP_INSTALL} \
 # Now the real stuff:
-    'ocrd_tesserocr >= 0.9.0'
+    'ocrd_tesserocr >= 0.9.5'
 
 
 # Check pip dependencies
diff --git a/build b/build
index 7bfd60c..dcc1f20 100755
--- a/build
+++ b/build
@@ -15,7 +15,7 @@ get_from_annex() {
 }
 get_from_web() {
   download_to 'https://qurator-data.de/calamari-models/GT4HistOCR/model.tar.xz' 'calamari-models/GT4HistOCR/2019-07-22T15_49+0200'
-  # XXX Calamari 1 model
+  download_to 'https://qurator-data.de/calamari-models/GT4HistOCR/2019-12-11T11_10+0100/model.tar.xz' 'calamari-models/GT4HistOCR/2019-12-11T11_10+0100'
   download_to 'https://qurator-data.de/tesseract-models/GT4HistOCR/models.tar' 'tesseract-models/GT4HistOCR'
   download_to 'https://qurator-data.de/sbb_textline_detector/models.tar.gz' 'textline_detection'
   download_to --strip-components 1 'https://qurator-data.de/sbb_binarization/models.tar.gz' 'sbb_binarization'