🐛 cli_line_dirs: Fix word differences section

By the time the word differences section was generated, the {gt,ocr}_words generators had already been drained, so nothing was left to iterate over. Fix by materializing both as lists. Fixes gh-124.
2025-07-13 04:19:59 +02:00 · 2024-12-12 19:57:12 +01:00 · 2024-12-12 19:57:12 +01:00 · f68c2b90bd
commit f68c2b90bd
parent 7dba6a7564
1 changed files with 3 additions and 3 deletions
--- a/src/dinglehopper/cli_line_dirs.py
+++ b/src/dinglehopper/cli_line_dirs.py
@@ -1,6 +1,6 @@
 import itertools
 import os
-from typing import Callable, Iterator, Optional, Tuple
+from typing import Callable, Iterator, Optional, Tuple, List
 import click
 from jinja2 import Environment, FileSystemLoader
@@ -127,8 +127,8 @@ def process(
    for k, (gt_fn, ocr_fn) in enumerate(gt_ocr_files):
        gt_text = plain_extract(gt_fn, include_filename_in_id=True)
        ocr_text = plain_extract(ocr_fn, include_filename_in_id=True)
-        gt_words = words_normalized(gt_text)
+        gt_words: List[str] = list(words_normalized(gt_text))
-        ocr_words = words_normalized(ocr_text)
+        ocr_words: List[str] = list(words_normalized(ocr_text))
        # Compute CER
        l_cer, l_n_characters = character_error_rate_n(gt_text, ocr_text)