From 735e9599d794ff7864f4d600d894f54912a31c1d Mon Sep 17 00:00:00 2001
From: "Gerber, Mike"
Date: Wed, 9 Oct 2019 13:36:54 +0200
Subject: [PATCH] =?UTF-8?q?=F0=9F=90=9B=20ocrd-bugs:=20Most/All=20workspac?=
 =?UTF-8?q?es=20in=20bag=20files=20don't=20validate?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 ocrd-bugs/page-files-as-jpeg.sh | 26 ++++++++++++++++++++++++++
 1 file changed, 26 insertions(+)
 create mode 100644 ocrd-bugs/page-files-as-jpeg.sh

diff --git a/ocrd-bugs/page-files-as-jpeg.sh b/ocrd-bugs/page-files-as-jpeg.sh
new file mode 100644
index 0000000..9969a80
--- /dev/null
+++ b/ocrd-bugs/page-files-as-jpeg.sh
@@ -0,0 +1,26 @@
+#!/bin/sh
+# Most/All workspaces in bag files don't validate
+# https://github.com/OCR-D/assets/issues/63
+#
+# Reproduction: create a virtualenv in a fresh temporary directory, install
+# ocrd into it with pip --pre, download the sample zip, unpack it with dtrx
+# and run the ocrd workspace validator on the mets.xml found in its data
+# directory. Needs virtualenv, wget and dtrx on PATH plus network access.
+
+set -e
+
+# Assign first so that a failing mktemp aborts the script under set -e.
+# If the substitution were passed to cd directly, a failed mktemp would leave
+# cd without an argument and it would switch to $HOME instead.
+workdir=$(mktemp -d)
+cd "$workdir"
+
+virtualenv venv
+. venv/bin/activate
+pip install --pre ocrd
+
+wget https://ocr-d-repo.scc.kit.edu/api/v1/dataresources/558280e0-c40a-49ae-81ab-679bc29567c3/data/gerstner_mechanik01_1831.zip
+dtrx gerstner_mechanik01_1831.zip
+
+cd gerstner_mechanik01_1831/data
+ocrd workspace validate mets.xml