From 2f7d01c7cde54729d583afdc57a6c9f65e3db79a Mon Sep 17 00:00:00 2001 From: Kai Labusch Date: Fri, 10 Nov 2023 17:28:30 +0100 Subject: [PATCH] fix alto2tsv bug --- qurator/tsvtools/cli.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/qurator/tsvtools/cli.py b/qurator/tsvtools/cli.py index c45ecea..f62b83a 100644 --- a/qurator/tsvtools/cli.py +++ b/qurator/tsvtools/cli.py @@ -148,7 +148,9 @@ def alto2tsv(alto_xml_file, tsv_out_file, purpose, image_url, ner_rest_endpoint, for region_idx, region in alto_iterate_textblocks(alto_xml_file): - for line, line_id, l_left, l_right, l_top, l_bottom in alto_iterate_lines(region): + for line, _, l_left, l_right, l_top, l_bottom in alto_iterate_lines(region): + + line_id = len(line_info) line_info.append((len(urls), l_left, l_right, l_top, l_bottom, line_id))