{
  "version": "0.0.1",
  "git_url": "https://github.com/qurator-spk/page2tsv",
  "tools": {
    "ocrd-neat-export": {
      "executable": "ocrd-neat-export",
      "description": "Convert PAGE-XML to neat-loadable TSV",
      "categories": [
        "Format-Conversion"
      ],
      "steps": [
        "format-conversion"
      ],
      "input_file_grp": [
        "INPUT"
      ],
      "output_file_grp": [
        "OUTPUT"
      ],
      "parameters": {
        "iiif_url_template": {
          "type": "string",
          "description": "URL template for lookup of images via IIIF based on {{ unique_identifier }}, {{ page_id }}, {{ page_no }} and {{ PPN }}. 'left', 'top', 'right', 'bottom', 'width', and 'height' are replaced by the neat JS.",
          "default": "https://content.staatsbibliothek-berlin.de/dc/{{ PPN }}-{{ page_no }}/left,top,width,height/full/0/default.jpg"
        },
        "scale_filegrp": {
          "type": "string",
          "description": "If the OCR was run on images with a different resolution than the 'full' IIIF size, use the images in this file group to scale. Set to empty string to disable",
          "default": ""
        },
        "noproxy": {
          "type": "boolean",
          "description": "Disable proxy if set",
          "default": true
        }
      }
    },
    "ocrd-neat-import": {
      "executable": "ocrd-neat-import",
      "description": "Re-integrate TSV into PAGE-XML",
      "categories": [
        "Format-Conversion"
      ],
      "steps": [
        "format-conversion"
      ],
      "input_file_grp": [
        "PAGE-GRP,TSV-GRP"
      ],
      "output_file_grp": [
        "OUTPUT"
      ],
      "parameters": {
        "keep_words": {
          "type": "boolean",
          "description": "After updating the line TextEquiv, remove (false) or keep (true) existing and probably inconsistent pc:Word",
          "default": false
        }
      }
    }
  }
}