1
0
Fork 0
mirror of https://github.com/qurator-spk/dinglehopper.git synced 2025-06-09 11:50:00 +02:00

🐛 dinglehopper: Fix reading OCR-D workspace files when only URLs are provided

This commit is contained in:
Gerber, Mike 2020-06-09 17:13:22 +02:00
parent ea1cc32b91
commit f699697eb3

View file

@@ -38,6 +38,8 @@ class OcrdDinglehopperEvaluate(Processor):
for n, page_id in enumerate(self.workspace.mets.physical_pages):
gt_file = self.workspace.mets.find_files(fileGrp=gt_grp, pageId=page_id)[0]
ocr_file = self.workspace.mets.find_files(fileGrp=ocr_grp, pageId=page_id)[0]
gt_file = self.workspace.download_file(gt_file)
ocr_file = self.workspace.download_file(ocr_file)
log.info("INPUT FILES %i / %s%s", n, gt_file, ocr_file)
file_id = self._make_file_id(ocr_file, ocr_grp, n)