✨ sbb_textline_detector: Add a OCR-D interface

2026-02-23 09:21:55 +01:00 · 2019-10-10 17:54:42 +02:00 · 2019-10-10 17:54:42 +02:00 · 0c915c75de
commit 0c915c75de
parent 561a6f8a90
7 changed files with 98 additions and 11 deletions
--- a/ocrd-tool.json
+++ b/ocrd-tool.json
@ -0,0 +1 @@
 qurator/sbb_textline_detector/ocrd-tool.json
--- a/qurator/sbb_textline_detector/init.py
+++ b/qurator/sbb_textline_detector/init.py
@ -1 +1,2 @@
 from .main import *
 from .ocrd_cli import *
--- a/qurator/sbb_textline_detector/main.py
+++ b/qurator/sbb_textline_detector/main.py
@ -35,16 +35,18 @@ __doc__ = \
 class textlineerkenner:
-    def __init__(self, image_dir, dir_out, dir_models):
+    def __init__(self, image_dir, dir_out, f_name, dir_models):
        self.image_dir = image_dir
        self.dir_out = dir_out
-        self.dir_models = dir_models
+        self.f_name = f_name
        if self.f_name is None:
            try:
                self.f_name = image_dir.split('/')[len(image_dir.split('/')) - 1]
                self.f_name = self.f_name.split('.')[0]
                print(self.f_name)
            except:
                self.f_name = self.f_name.split('.')[0]
        self.dir_models = dir_models
        self.kernel = np.ones((5, 5), np.uint8)
        self.model_page_dir = dir_models + '/model_page.h5'
        self.model_region_dir = dir_models + '/model_strukturerkennung.h5'
@ -365,6 +367,7 @@ class textlineerkenner:
        return img_r
    def get_image_and_scales(self):
        print(self.image_dir)
        self.image = cv2.imread(self.image_dir)
        self.height_org = self.image.shape[0]
        self.width_org = self.image.shape[1]
@ -1298,7 +1301,7 @@ class textlineerkenner:
            unireg.text = ' '
        tree = ET.ElementTree(data)
-        tree.write(dir_of_image + self.f_name + ".xml")
+        tree.write(os.path.join(dir_of_image, self.f_name) + ".xml")
    def run(self):
        self.get_image_and_scales()
@ -1321,7 +1324,7 @@ class textlineerkenner:
 def main(image, out, model):
    possibles = globals()  # XXX unused?
    possibles.update(locals())
-    x = textlineerkenner(image, out, model)
+    x = textlineerkenner(image, out, None, model)
    x.run()
--- a/qurator/sbb_textline_detector/ocrd-tool.json
+++ b/qurator/sbb_textline_detector/ocrd-tool.json
@ -0,0 +1,19 @@
 {
  "version": "0.0.1",
  "tools": {
    "ocrd_sbb_textline_detector": {
      "executable": "ocrd_sbb_textline_detector",
      "description": "Detect lines",
      "steps": ["layout/segmentation/line"],
      "input_file_grp": [
        "OCR-D-IMG"
      ],
      "output_file_grp": [
        "OCR-D-SBB-SEG-LINE"
      ],
      "parameters": {
        "model": {"type": "string", "format": "file", "cacheable": true}
      }
    }
  }
 }
--- a/qurator/sbb_textline_detector/ocrd_cli.py
+++ b/qurator/sbb_textline_detector/ocrd_cli.py
@ -0,0 +1,61 @@
 import json
 import os
 import click
 from ocrd import Processor
 from ocrd.decorators import ocrd_cli_options, ocrd_cli_wrap_processor
 from ocrd_utils import concat_padded, getLogger
 from pkg_resources import resource_string
 from qurator.sbb_textline_detector import textlineerkenner
 log = getLogger('processor.OcrdSbbTextlineDetectorRecognize')
 OCRD_TOOL = json.loads(resource_string(__name__, 'ocrd-tool.json').decode('utf8'))
@click.command()
@ocrd_cli_options
 def ocrd_sbb_textline_detector(*args, **kwargs):
    return ocrd_cli_wrap_processor(OcrdSbbTextlineDetectorRecognize, *args, **kwargs)
 class OcrdSbbTextlineDetectorRecognize(Processor):
    def __init__(self, *args, **kwargs):
        kwargs['ocrd_tool'] = OCRD_TOOL['tools']['ocrd_sbb_textline_detector']
        super(OcrdSbbTextlineDetectorRecognize, self).__init__(*args, **kwargs)
    def _make_file_id(self, input_file, input_file_grp, n):
        file_id = input_file.ID.replace(input_file_grp, self.output_file_grp)
        if file_id == input_file.ID:
            file_id = concat_padded(self.output_file_grp, n)
        return file_id
    def process(self):
        for n, page_id in enumerate(self.workspace.mets.physical_pages):
            image_file = self.workspace.mets.find_files(fileGrp=self.input_file_grp, pageId=page_id)[0]
            log.info("INPUT FILE %i / %s", n, image_file)
            file_id = self._make_file_id(image_file, self.output_file_grp, n)
            # Process the files
            try:
                os.mkdir(self.output_file_grp)
            except FileExistsError:
                pass
            model = self.parameter['model']
            x = textlineerkenner(image_file.local_filename, self.output_file_grp, file_id, model)
            x.run()
            self.workspace.add_file(
                 ID=file_id + '.xml',
                 file_grp=self.output_file_grp,
                 pageId=page_id,
                 mimetype='application/vnd.prima.page+xml',
                 local_filename=self.output_file_grp + '/' + file_id)
 if __name__ == '__main__':
    ocrd_sbb_textline_detector()
--- a/requirements.txt
+++ b/requirements.txt
@ -1,5 +1,5 @@
 opencv-python
-numpy<=1.14.5
+numpy
 matplotlib
 seaborn
 tqdm
@ -9,3 +9,4 @@ scikit-learn
 tensorflow-gpu < 2.0
 scipy
 click
 ocrd >= 1.0.0b19
--- a/setup.py
+++ b/setup.py
@ -21,6 +21,7 @@ setup(
    entry_points={
      'console_scripts': [
        "sbb_textline_detector=qurator.sbb_textline_detector:main",
        "ocrd_sbb_textline_detector=qurator.sbb_textline_detector:ocrd_sbb_textline_detector",
      ]
    },
    python_requires='>=3.6.0',
		`@ -0,0 +1 @@`
							`qurator/sbb_textline_detector/ocrd-tool.json`
`@ -1 +1,2 @@`
	`from .main import *`	`from .main import *`
		`from .ocrd_cli import *`