mirror of
https://github.com/qurator-spk/ocrd-galley.git
synced 2025-06-08 22:29:56 +02:00
Add OCR step
This commit is contained in:
parent
a64b9cf5c8
commit
9bd3853c78
1 changed files with 9 additions and 0 deletions
|
@ -38,9 +38,18 @@ do_linesegmentation() {
|
|||
#ocrd workspace validate mets.xml
|
||||
}
|
||||
|
||||
# Run Tesseract text recognition on the workspace described by mets.xml.
#
# Steps:
#   1. Call remove_filegrp for OCR-D-OCR-TESS (helper defined elsewhere in
#      this script; presumably clears output of a previous run -- confirm).
#   2. Run ocrd-tesserocr-recognize with OCR-D-SEG-LINE as the input file
#      group and OCR-D-OCR-TESS as the output file group.
#
# Side effect: sets the global variable ocrd_tesserocr_recognize_parameters.
do_ocr() {
  ocrd_tesserocr_recognize_parameters='{ "model": "eng" }'  # TODO mods:language + fontident → model

  remove_filegrp OCR-D-OCR-TESS mets.xml

  # The JSON is handed to -p through process substitution. The expansion is
  # quoted so the string is passed through verbatim: unquoted, it would be
  # subject to word splitting and pathname expansion, which can corrupt the
  # JSON once the value is no longer a fixed literal.
  ocrd-tesserocr-recognize -l DEBUG \
    -m mets.xml -I OCR-D-SEG-LINE -O OCR-D-OCR-TESS \
    -p <(printf '%s\n' "$ocrd_tesserocr_recognize_parameters")

  #ocrd workspace validate mets.xml
}
|
||||
|
||||
# Invoke the step functions one after another. do_ocr reads the
# OCR-D-SEG-LINE file group; presumably do_linesegmentation produces it,
# so the order matters -- confirm against the function definitions.
do_fontident
|
||||
do_linesegmentation
|
||||
do_ocr
|
||||
|
||||
|
||||
# XXX Multiple calls create multiple identical mets:agent elements
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue