From e196a70ea5eee7834f658abc50dda4d44c1c2a5a Mon Sep 17 00:00:00 2001 From: "Gerber, Mike" Date: Wed, 21 Apr 2021 11:35:29 +0200 Subject: [PATCH] =?UTF-8?q?=F0=9F=9A=A7=20ocrd-galley:=20Add=20model=20fil?= =?UTF-8?q?es=20for=20eynollah?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- Dockerfile-eynollah | 2 +- build | 2 ++ build-tmp-XXX | 1 + data | 2 +- 4 files changed, 5 insertions(+), 2 deletions(-) diff --git a/Dockerfile-eynollah b/Dockerfile-eynollah index f1f1e02..8ee7968 100644 --- a/Dockerfile-eynollah +++ b/Dockerfile-eynollah @@ -11,7 +11,7 @@ RUN ${PIP_INSTALL} \ # Copy OCR models -# XXX +COPY data/eynollah /var/lib/eynollah # Check pip dependencies diff --git a/build b/build index f42cd5f..a1e36f9 100755 --- a/build +++ b/build @@ -14,6 +14,7 @@ get_from_annex() { annex_get 'textline_detection/*.h5' annex_get 'mirror/github.com/tesseract-ocr/tessdata_best/archive/4.0.0-repacked.tar.gz' annex_get 'sbb_binarization/2021-03-09/*.h5' + annex_get 'eynollah/*.h5' } get_from_web() { download_to 'https://qurator-data.de/calamari-models/GT4HistOCR/model.tar.xz' 'calamari-models/GT4HistOCR/2019-07-22T15_49+0200' @@ -22,6 +23,7 @@ get_from_web() { download_to 'https://qurator-data.de/sbb_textline_detector/models.tar.gz' 'textline_detection' download_to --strip-components 1 'https://qurator-data.de/sbb_binarization/2021-03-09/models.tar.gz' 'sbb_binarization/2021-03-09' download_to --no-unpack 'https://qurator-data.de/mirror/github.com/tesseract-ocr/tessdata_best/archive/4.0.0-repacked.tar.gz' 'mirror/github.com/tesseract-ocr/tessdata_best/archive/4.0.0-repacked.tar.gz' + download_to --strip-components 1 'https://qurator-data.de/eynollah/models_eynollah.tar.gz' 'eynollah' } . $self_dir/qurator_data_lib.sh handle_data diff --git a/build-tmp-XXX b/build-tmp-XXX index 52dfeb4..0072aa3 100755 --- a/build-tmp-XXX +++ b/build-tmp-XXX @@ -12,6 +12,7 @@ get_from_web() { download_to 'https://qurator-data.de/sbb_textline_detector/models.tar.gz' 'textline_detection' download_to --strip-components 1 'https://qurator-data.de/sbb_binarization/2021-03-09/models.tar.gz' 'sbb_binarization/2021-03-09' download_to --no-unpack 'https://qurator-data.de/mirror/github.com/tesseract-ocr/tessdata_best/archive/4.0.0-repacked.tar.gz' 'mirror/github.com/tesseract-ocr/tessdata_best/archive/4.0.0-repacked.tar.gz' + download_to --strip-components 1 'https://qurator-data.de/eynollah/models_eynollah.tar.gz' 'eynollah' } . $self_dir/qurator_data_lib.sh handle_data diff --git a/data b/data index c67004e..7244786 160000 --- a/data +++ b/data @@ -1 +1 @@ -Subproject commit c67004ecfff404409a6c47b53088e8b7efadc85f +Subproject commit 7244786435c10f562f4ba40e27a39ab808eee977