|
|
@ -34,8 +34,8 @@ class OcrdDinglehopperEvaluate(Processor):
|
|
|
|
metrics = self.parameter['metrics']
|
|
|
|
metrics = self.parameter['metrics']
|
|
|
|
gt_grp, ocr_grp = self.input_file_grp.split(',')
|
|
|
|
gt_grp, ocr_grp = self.input_file_grp.split(',')
|
|
|
|
for n, page_id in enumerate(self.workspace.mets.physical_pages):
|
|
|
|
for n, page_id in enumerate(self.workspace.mets.physical_pages):
|
|
|
|
gt_file = self.workspace.mets.find_files(fileGrp=gt_grp, pageId=page_id)[0]
|
|
|
|
gt_file = next(self.workspace.mets.find_files(fileGrp=gt_grp, pageId=page_id))
|
|
|
|
ocr_file = self.workspace.mets.find_files(fileGrp=ocr_grp, pageId=page_id)[0]
|
|
|
|
ocr_file = next(self.workspace.mets.find_files(fileGrp=ocr_grp, pageId=page_id))
|
|
|
|
gt_file = self.workspace.download_file(gt_file)
|
|
|
|
gt_file = self.workspace.download_file(gt_file)
|
|
|
|
ocr_file = self.workspace.download_file(ocr_file)
|
|
|
|
ocr_file = self.workspace.download_file(ocr_file)
|
|
|
|
log.info("INPUT FILES %i / %s↔ %s", n, gt_file, ocr_file)
|
|
|
|
log.info("INPUT FILES %i / %s↔ %s", n, gt_file, ocr_file)
|
|
|
|