mirror of
https://github.com/qurator-spk/ocrd-galley.git
synced 2025-07-05 19:19:53 +02:00
✨ Use dinglehopper's new OCR-D interface
This commit is contained in:
parent
d5aa273b44
commit
85ff80d548
3 changed files with 4 additions and 16 deletions
|
@@ -20,10 +20,5 @@ RUN pip3 install --no-cache-dir -r /tmp/requirements.txt
|
||||||
COPY my_ocrd_workflow /usr/bin
|
COPY my_ocrd_workflow /usr/bin
|
||||||
COPY xsd /usr/bin/xsd
|
COPY xsd /usr/bin/xsd
|
||||||
|
|
||||||
# XXX Hack
|
|
||||||
COPY ../experiments/ocr-eval /usr/local/ocr-eval
|
|
||||||
RUN pip3 install --no-cache-dir -r /usr/local/ocr-eval/requirements.txt
|
|
||||||
|
|
||||||
|
|
||||||
WORKDIR /data
|
WORKDIR /data
|
||||||
CMD ["/usr/bin/my_ocrd_workflow"]
|
CMD ["/usr/bin/my_ocrd_workflow"]
|
||||||
|
|
|
@@ -155,17 +155,8 @@ do_validate
|
||||||
|
|
||||||
|
|
||||||
if ocrd workspace list-group | grep -q OCR-D-GT-PAGE; then
|
if ocrd workspace list-group | grep -q OCR-D-GT-PAGE; then
|
||||||
for g in `ocrd workspace list-page`; do
|
remove_filegrp OCR-D-OCR-TESS-EVAL mets.xml
|
||||||
echo "== $g"
|
ocrd-dinglehopper -m mets.xml -I OCR-D-GT-PAGE,OCR-D-OCR-TESS -O OCR-D-OCR-TESS-EVAL
|
||||||
gt=`ocrd workspace find -G OCR-D-GT-PAGE -g $g`
|
|
||||||
ocr=`ocrd workspace find -G OCR-D-OCR-TESS -g $g`
|
|
||||||
|
|
||||||
if [ -n "$gt" ]; then
|
|
||||||
python3 /usr/local/ocr-eval/cli.py $gt $ocr
|
|
||||||
mv report.json report-$g.json
|
|
||||||
mv report.html report-$g.html
|
|
||||||
fi
|
|
||||||
done
|
|
||||||
fi
|
fi
|
||||||
|
|
||||||
# vim:tw=120:
|
# vim:tw=120:
|
||||||
|
|
|
@@ -6,3 +6,5 @@ https://github.com/mikegerber/ocrd_kraken/archive/fix/pass-down-page-id.tar.gz
|
||||||
|
|
||||||
tesserocr == 2.3.1 # 2.4.0 fails with Ubuntu 18.04's tesseract
|
tesserocr == 2.3.1 # 2.4.0 fails with Ubuntu 18.04's tesseract
|
||||||
ocrd_tesserocr
|
ocrd_tesserocr
|
||||||
|
|
||||||
|
https://github.com/qurator-spk/dinglehopper/archive/0f056b9.tar.gz
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue