From f699697eb337d5379eb99387a7b562e8774e4188 Mon Sep 17 00:00:00 2001 From: "Gerber, Mike" Date: Tue, 9 Jun 2020 17:13:22 +0200 Subject: [PATCH] =?UTF-8?q?=F0=9F=90=9B=20dinglehopper:=20Fix=20reading=20?= =?UTF-8?q?OCR-D=20workspace=20files=20when=20only=20URLs=20are=20provided?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- qurator/dinglehopper/ocrd_cli.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/qurator/dinglehopper/ocrd_cli.py b/qurator/dinglehopper/ocrd_cli.py index 8ab5cf2..a23dffd 100644 --- a/qurator/dinglehopper/ocrd_cli.py +++ b/qurator/dinglehopper/ocrd_cli.py @@ -38,6 +38,8 @@ class OcrdDinglehopperEvaluate(Processor): for n, page_id in enumerate(self.workspace.mets.physical_pages): gt_file = self.workspace.mets.find_files(fileGrp=gt_grp, pageId=page_id)[0] ocr_file = self.workspace.mets.find_files(fileGrp=ocr_grp, pageId=page_id)[0] + gt_file = self.workspace.download_file(gt_file) + ocr_file = self.workspace.download_file(ocr_file) log.info("INPUT FILES %i / %s↔ %s", n, gt_file, ocr_file) file_id = self._make_file_id(ocr_file, ocr_grp, n)