🚧 dinglehopper: WIP data structure for extracted text

2026-06-13 00:19:24 +02:00 · 2020-06-10 19:49:12 +02:00 · 2020-06-10 19:49:12 +02:00 · 8e3a19d7e9
commit 8e3a19d7e9
parent 93608ba697
2 changed files with 3 additions and 2 deletions
--- a/extracted_text.py
+++ b/extracted_text.py
@@ -2,6 +2,9 @@ import attr
 import unicodedata
 # TODO handle grapheme cluster positions?
@attr.s(frozen=True)
 class ExtractedText:
    segments = attr.ib()
--- a/extracted_text_test.py
+++ b/extracted_text_test.py
@@ -13,7 +13,5 @@ def test_text():
    assert test1.segment_id_for_pos(3) is None
    assert test1.segment_id_for_pos(10) == 's2'
 # TODO handle grapheme cluster positions?
 # ExtractedTextSegment('foo', unicodedata.normalize('NFD', 'Schlyñ'))
 ExtractedTextSegment('foo', unicodedata.normalize('NFC', 'Schlyñ'))