From 28bb482cebb4c8f1bd9f373725760b803efb09dd Mon Sep 17 00:00:00 2001 From: "Gerber, Mike" Date: Mon, 10 Feb 2020 19:26:04 +0100 Subject: [PATCH] =?UTF-8?q?=E2=9C=A8=20Produce=20word=20results?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- my_ocrd_workflow | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/my_ocrd_workflow b/my_ocrd_workflow index 6234d33..ca3907f 100755 --- a/my_ocrd_workflow +++ b/my_ocrd_workflow @@ -68,7 +68,8 @@ do_ocr() { # Perform OCR on the segmented lines ocrd_tesserocr_recognize_parameters='{ - "model": "GT4HistOCR_2000000" + "model": "GT4HistOCR_2000000", + "textequiv_level": "word" }' ocrd workspace remove-group -rf OCR-D-OCR-TESS ocrd-tesserocr-recognize -I OCR-D-SEG-LINE -O OCR-D-OCR-TESS -p "$ocrd_tesserocr_recognize_parameters" @@ -79,7 +80,7 @@ do_ocr_calamari() { ocrd_calamari_recognize_parameters='{ "checkpoint": "/var/lib/calamari-models/GT4HistOCR/2019-07-22T15:49+0200/*.ckpt.json", - "textequiv_level": "line" + "textequiv_level": "word" }' ocrd workspace remove-group -rf OCR-D-OCR-CALAMARI ocrd-calamari-recognize -I OCR-D-SEG-LINE -O OCR-D-OCR-CALAMARI -p "$ocrd_calamari_recognize_parameters"