mirror of
https://github.com/qurator-spk/eynollah.git
synced 2025-08-28 19:39:55 +02:00
Merge pull request #171 from bertsky/ocrd-machine-based-ro
OCR-D processor: expose reading_order_machine_based
This commit is contained in:
commit
a2359ea4c4
2 changed files with 8 additions and 0 deletions
|
@ -74,6 +74,11 @@
|
||||||
"type": "boolean",
|
"type": "boolean",
|
||||||
"default": false,
|
"default": false,
|
||||||
"description": "ignore the special role of headings during reading order detection"
|
"description": "ignore the special role of headings during reading order detection"
|
||||||
|
},
|
||||||
|
"reading_order_machine_based": {
|
||||||
|
"type": "boolean",
|
||||||
|
"default": false,
|
||||||
|
"description": "use data-driven (rather than rule-based) reading order detection"
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"resources": [
|
"resources": [
|
||||||
|
|
|
@ -24,6 +24,7 @@ class EynollahProcessor(Processor):
|
||||||
allow_enhancement=self.parameter['allow_enhancement'],
|
allow_enhancement=self.parameter['allow_enhancement'],
|
||||||
curved_line=self.parameter['curved_line'],
|
curved_line=self.parameter['curved_line'],
|
||||||
right2left=self.parameter['right_to_left'],
|
right2left=self.parameter['right_to_left'],
|
||||||
|
reading_order_machine_based=self.parameter['reading_order_machine_based'],
|
||||||
ignore_page_extraction=self.parameter['ignore_page_extraction'],
|
ignore_page_extraction=self.parameter['ignore_page_extraction'],
|
||||||
light_version=self.parameter['light_version'],
|
light_version=self.parameter['light_version'],
|
||||||
textline_light=self.parameter['textline_light'],
|
textline_light=self.parameter['textline_light'],
|
||||||
|
@ -57,6 +58,8 @@ class EynollahProcessor(Processor):
|
||||||
- If ``ignore_page_extraction``, then attempt no cropping of the page.
|
- If ``ignore_page_extraction``, then attempt no cropping of the page.
|
||||||
- If ``curved_line``, then compute contour polygons for text lines
|
- If ``curved_line``, then compute contour polygons for text lines
|
||||||
instead of simple bounding boxes.
|
instead of simple bounding boxes.
|
||||||
|
- If ``reading_order_machine_based``, then detect reading order via
|
||||||
|
data-driven model instead of geometrical heuristics.
|
||||||
|
|
||||||
Produce a new output file by serialising the resulting hierarchy.
|
Produce a new output file by serialising the resulting hierarchy.
|
||||||
"""
|
"""
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue