🧹 Remove font identification for now

pull/27/head
Gerber, Mike 5 years ago
parent 07555e8270
commit b468d688f2

@ -43,25 +43,6 @@ do_binarization() {
-p '{"impl": "sauvola-ms-split"}' -p '{"impl": "sauvola-ms-split"}'
} }
do_fontident() {
# Identify fonts in the images
network=`python3 -c "import ocrd_typegroups_classifier, os; print(os.path.join(os.path.dirname(ocrd_typegroups_classifier.__file__), 'models', 'classifier.tgc'))"`
ocrd_typegroups_classifier_parameters="
{
\"network\": \"$network\",
\"stride\": 143
}"
remove_filegrp OCR-D-OCR-FONTIDENT mets.xml
ocrd-typegroups-classifier -l $LOG_LEVEL \
-m mets.xml -I OCR-D-IMG -O OCR-D-OCR-FONTIDENT \
-p "$ocrd_typegroups_classifier_parameters"
# XXX Check if ocrd-typegroups-classifier uses the whole image
# XXX does DEFAULT have any meaning? /buerger_gedichte_1778.ocrd does not have
# any DEFAULT, yet -I DEFAULT seems to work for ocrd-typegroups-classifier
}
do_linesegmentation_tesserocr() { do_linesegmentation_tesserocr() {
# Segment the lines in the binarized images # Segment the lines in the binarized images
@ -145,10 +126,6 @@ page_upgrade_to_2019() {
pip3 list pip3 list
#do_fontident
#do_validate
do_binarization do_binarization
do_validate do_validate

@ -2,8 +2,6 @@ tensorflow-gpu < 2.0 # Needed for sbb_text_linedetector
ocrd >= 2.0.0 ocrd >= 2.0.0
https://github.com/mikegerber/ocrd_typegroups_classifier/archive/fix/pass-down-page-id.tar.gz # XXX git+https://github.com/seuretm/ocrd_typegroups_classifier.git
https://github.com/mikegerber/ocrd_kraken/archive/fix/pass-down-page-id.tar.gz # XXX ocrd_kraken >= 0.1.1 https://github.com/mikegerber/ocrd_kraken/archive/fix/pass-down-page-id.tar.gz # XXX ocrd_kraken >= 0.1.1
ocrd_tesserocr ocrd_tesserocr

Loading…
Cancel
Save