mirror of
https://github.com/qurator-spk/dinglehopper.git
synced 2025-06-09 11:50:00 +02:00
🧹 dinglehopper: Remove obsolete XXX about the PAGE hierarchy
This commit is contained in:
parent
453247c2f3
commit
bc05f83088
1 changed file with 0 additions and 1 deletion
|
@@ -151,7 +151,6 @@ def page_extract(tree):
|
|||
for region in tree.iterfind('.//page:TextRegion', namespaces=nsmap):
|
||||
regions.append(ExtractedTextSegment.from_text_segment(region, nsmap))
|
||||
|
||||
# XXX Does a file have to have regions etc.? region vs lines etc.
|
||||
# Filter empty region texts
|
||||
regions = [r for r in regions if r.text is not None]
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue