From 42e8bf67e27f5f25096027543dc4af797c0273c4 Mon Sep 17 00:00:00 2001 From: "Gerber, Mike" Date: Mon, 30 Nov 2020 17:52:24 +0100 Subject: [PATCH] =?UTF-8?q?=F0=9F=9A=A7=20Add=20a.=20our=20augmented=20GT4?= =?UTF-8?q?HistOCR=20Calamari=20model=20b.=20chreul's=20GT4HistOCR=20model?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- Dockerfile-ocrd_calamari | 4 +++- build | 2 ++ data | 2 +- 3 files changed, 6 insertions(+), 2 deletions(-) diff --git a/Dockerfile-ocrd_calamari b/Dockerfile-ocrd_calamari index 186c8b7..64d2e62 100644 --- a/Dockerfile-ocrd_calamari +++ b/Dockerfile-ocrd_calamari @@ -14,7 +14,9 @@ RUN ${PIP_INSTALL} \ # Copy OCR models RUN mkdir -p /var/lib/calamari-models/GT4HistOCR COPY data/calamari-models/GT4HistOCR/2019-12-11T11_10+0100 /var/lib/calamari-models/GT4HistOCR/2019-12-11T11_10+0100 - +# XXX experimental +COPY data/calamari-models/GT4HistOCR/2019-12-18T17_24+0100-with-augmentation-UNTESTED /var/lib/calamari-models/GT4HistOCR/2019-12-18T17_24+0100 +COPY data/mirror/github.com/Calamari-OCR/calamari_models/gt4histocr /var/lib/calamari-models/GT4HistOCR-chreul # Check pip dependencies diff --git a/build b/build index c670633..f0a37d3 100755 --- a/build +++ b/build @@ -8,6 +8,8 @@ DATA_SUBDIR=data get_from_annex() { annex_get 'calamari-models/GT4HistOCR/2019-07-22T15_49+0200/*.ckpt*' annex_get 'calamari-models/GT4HistOCR/2019-12-11T11_10+0100/*.ckpt*' + annex_get 'calamari-models/GT4HistOCR/2019-12-18T17_24+0100*/*.ckpt*' + annex_get 'mirror/github.com/Calamari-OCR/calamari_models/gt4histocr/*.ckpt*' annex_get 'tesseract-models/GT4HistOCR/*.traineddata' annex_get 'textline_detection/*.h5' annex_get 'mirror/github.com/tesseract-ocr/tessdata_best/archive/4.0.0-repacked.tar.gz' diff --git a/data b/data index bd1628e..3fbdbcf 160000 --- a/data +++ b/data @@ -1 +1 @@ -Subproject commit bd1628e1aefbb0766655ee3726b4b0234d20a4f1 +Subproject commit 3fbdbcf368f05ea76253d6d3327644c4d755d6f8