From 1f12b0b1e8b58dac670a4058dfa3e4f08aa3f169 Mon Sep 17 00:00:00 2001 From: "Gerber, Mike" Date: Thu, 19 Nov 2020 18:11:41 +0100 Subject: [PATCH] =?UTF-8?q?=F0=9F=A7=B9=20Remove=20old=20OCR-D=20bug=20rep?= =?UTF-8?q?roducers?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../bug-lohenstein-ocrd-typegroups-classifier.sh | 13 ------------- ocrd-bugs/bug-ocropy-segment-breakage.sh | 10 ---------- ocrd-bugs/bug-ocropy-segment-littering.sh | 15 --------------- ocrd-bugs/bug-remote-image.sh | 7 ------- .../bug-tesserocr-segment-line-no-description.sh | 2 -- ...g-tesserocr-segment-line-should-give-error.sh | 6 ------ ocrd-bugs/page-files-as-jpeg.sh | 16 ---------------- 7 files changed, 69 deletions(-) delete mode 100644 ocrd-bugs/bug-lohenstein-ocrd-typegroups-classifier.sh delete mode 100644 ocrd-bugs/bug-ocropy-segment-breakage.sh delete mode 100644 ocrd-bugs/bug-ocropy-segment-littering.sh delete mode 100644 ocrd-bugs/bug-remote-image.sh delete mode 100644 ocrd-bugs/bug-tesserocr-segment-line-no-description.sh delete mode 100644 ocrd-bugs/bug-tesserocr-segment-line-should-give-error.sh delete mode 100644 ocrd-bugs/page-files-as-jpeg.sh diff --git a/ocrd-bugs/bug-lohenstein-ocrd-typegroups-classifier.sh b/ocrd-bugs/bug-lohenstein-ocrd-typegroups-classifier.sh deleted file mode 100644 index d7fb9ab..0000000 --- a/ocrd-bugs/bug-lohenstein-ocrd-typegroups-classifier.sh +++ /dev/null @@ -1,13 +0,0 @@ -#!/bin/bash -x -cd `mktemp -d` -wget https://ocr-d-repo.scc.kit.edu/api/v1/dataresources/8d8aa287-94ca-48e3-84a8-1ee602871550/data/lohenstein_agrippina_1665.ocrd.zip -dtrx lohenstein_agrippina_1665.ocrd.zip -cd lohenstein_agrippina_1665.ocrd/data -ocrd_typegroups_classifier_parameters=' - { - "network": "/home/mike/devel/OCR-D/monorepo/ocrd_typegroups_classifier/ocrd_typegroups_classifier/models/classifier.tgc", - "stride":143 - }' -ocrd-typegroups-classifier -l DEBUG \ - -m mets.xml -I OCR-D-IMG -O OCR-D-FONTIDENT \ - -p <(echo $ocrd_typegroups_classifier_parameters) diff --git a/ocrd-bugs/bug-ocropy-segment-breakage.sh b/ocrd-bugs/bug-ocropy-segment-breakage.sh deleted file mode 100644 index 18da71d..0000000 --- a/ocrd-bugs/bug-ocropy-segment-breakage.sh +++ /dev/null @@ -1,10 +0,0 @@ -# zips all from https://ocr-d-repo.scc.kit.edu/api/v1/metastore/bagit -for z in benner_herrnhuterey04_1748.ocrd.zip buerger_gedichte_1778.ocrd.zip estor_rechtsgelehrsamkeit02_1758.ocrd.zip lohenstein_agrippina_1665.ocrd.zip silesius_seelenlust01_1657.ocrd.zip; do - echo "== $z" - cd `mktemp -d` - cp /srv/data/OCR-D/$z . - dtrx $z - cd ${z//.zip}/data - - ocrd-ocropy-segment -l DEBUG -m mets.xml -I OCR-D-IMG -O OCR-D-SEG-LINE 2>&1 | tail -n 1 -done diff --git a/ocrd-bugs/bug-ocropy-segment-littering.sh b/ocrd-bugs/bug-ocropy-segment-littering.sh deleted file mode 100644 index 50ec27b..0000000 --- a/ocrd-bugs/bug-ocropy-segment-littering.sh +++ /dev/null @@ -1,15 +0,0 @@ -#!/bin/bash -x -cd `mktemp -d` - -virtualenv -p /usr/bin/python3 venv -. venv/bin/activate -pip install ocrd-ocropy - -wget https://ocr-d-repo.scc.kit.edu/api/v1/dataresources/1b0fb8b5-3397-4c99-9ec3-24d5954ac0fb/data/bernd_lebensbeschreibung_1738.ocrd.zip -dtrx bernd_lebensbeschreibung_1738.ocrd.zip - -cd bernd_lebensbeschreibung_1738.ocrd/data -ocrd-ocropy-segment -m mets.xml -I OCR-D-IMG -O OCR-D-SEG-LINES - -pip list | grep ocrd -ls -l diff --git a/ocrd-bugs/bug-remote-image.sh b/ocrd-bugs/bug-remote-image.sh deleted file mode 100644 index 6a3fd37..0000000 --- a/ocrd-bugs/bug-remote-image.sh +++ /dev/null @@ -1,7 +0,0 @@ -#!/bin/sh -set -x -cd `mktemp -d` -wget -q https://ocr-d-repo.scc.kit.edu/api/v1/dataresources/f15fb8c8-3842-4314-9a44-5e8b472d7bfc/data/buerger_gedichte_1778.ocrd.zip -dtrx buerger_gedichte_1778.ocrd.zip -cd buerger_gedichte_1778.ocrd/data -ocrd workspace validate mets.xml diff --git a/ocrd-bugs/bug-tesserocr-segment-line-no-description.sh b/ocrd-bugs/bug-tesserocr-segment-line-no-description.sh deleted file mode 100644 index c45a90b..0000000 --- a/ocrd-bugs/bug-tesserocr-segment-line-no-description.sh +++ /dev/null @@ -1,2 +0,0 @@ -#!/bin/bash -x -ocrd-tesserocr-segment-line --help diff --git a/ocrd-bugs/bug-tesserocr-segment-line-should-give-error.sh b/ocrd-bugs/bug-tesserocr-segment-line-should-give-error.sh deleted file mode 100644 index a5b916b..0000000 --- a/ocrd-bugs/bug-tesserocr-segment-line-should-give-error.sh +++ /dev/null @@ -1,6 +0,0 @@ -#!/bin/bash -x -cd `mktemp -d` -wget https://ocr-d-repo.scc.kit.edu/api/v1/dataresources/8d8aa287-94ca-48e3-84a8-1ee602871550/data/lohenstein_agrippina_1665.ocrd.zip -dtrx lohenstein_agrippina_1665.ocrd.zip -cd lohenstein_agrippina_1665.ocrd/data -ocrd-tesserocr-segment-line -l DEBUG -m mets.xml -I DOES-NOT-EXIST -O OCR-D-SEG-REGION diff --git a/ocrd-bugs/page-files-as-jpeg.sh b/ocrd-bugs/page-files-as-jpeg.sh deleted file mode 100644 index 9969a80..0000000 --- a/ocrd-bugs/page-files-as-jpeg.sh +++ /dev/null @@ -1,16 +0,0 @@ -#!/bin/sh -# Most/All workspaces in bag files don't validate -# https://github.com/OCR-D/assets/issues/63 - -set -e - -cd `mktemp -d` -virtualenv venv -. venv/bin/activate -pip install --pre ocrd - -wget https://ocr-d-repo.scc.kit.edu/api/v1/dataresources/558280e0-c40a-49ae-81ab-679bc29567c3/data/gerstner_mechanik01_1831.zip -dtrx gerstner_mechanik01_1831.zip - -cd gerstner_mechanik01_1831/data -ocrd workspace validate mets.xml