Add OCR step

This commit is contained in:
Gerber, Mike 2019-06-19 13:02:54 +02:00
parent a64b9cf5c8
commit 9bd3853c78

View file

@ -38,9 +38,18 @@ do_linesegmentation() {
#ocrd workspace validate mets.xml
}
# Run the Tesseract OCR processor on the workspace in the current directory.
#
# Calls remove_filegrp for OCR-D-OCR-TESS on mets.xml first (presumably to
# clear the output of a previous run -- confirm against remove_filegrp), then
# runs ocrd-tesserocr-recognize with OCR-D-SEG-LINE as the input file group
# and OCR-D-OCR-TESS as the output file group.
#
# Arguments: none
# Globals:   none written; the parameter JSON is kept function-local
# Returns:   exit status of ocrd-tesserocr-recognize
do_ocr() {
  # TODO mods:language + fontident → model
  local ocrd_tesserocr_recognize_parameters='{ "model": "eng" }'

  remove_filegrp OCR-D-OCR-TESS mets.xml

  # The parameter JSON is passed through process substitution, so no
  # temporary file is needed. The expansion is quoted and written with printf
  # so the JSON reaches the processor verbatim (no word splitting, no
  # globbing, no echo option/backslash surprises).
  ocrd-tesserocr-recognize -l DEBUG \
    -m mets.xml -I OCR-D-SEG-LINE -O OCR-D-OCR-TESS \
    -p <(printf '%s\n' "$ocrd_tesserocr_recognize_parameters")
  #ocrd workspace validate mets.xml
}
# Run the workflow steps one after another. The order matters: do_ocr reads
# the OCR-D-SEG-LINE file group, which is presumably written by
# do_linesegmentation (confirm against that function).
do_fontident
do_linesegmentation
do_ocr
# XXX Multiple calls create multiple identical mets:agent elements