1
0
Fork 0
mirror of https://github.com/qurator-spk/dinglehopper.git synced 2025-06-09 20:00:01 +02:00

🧹 dinglehopper: Remove obsolete XXX about the PAGE hierarchy

This commit is contained in:
Gerber, Mike 2020-06-12 17:04:07 +02:00
parent 453247c2f3
commit bc05f83088

View file

@@ -151,7 +151,6 @@ def page_extract(tree):
for region in tree.iterfind('.//page:TextRegion', namespaces=nsmap):
regions.append(ExtractedTextSegment.from_text_segment(region, nsmap))
-# XXX Does a file have to have regions etc.? region vs lines etc.
# Filter empty region texts
regions = [r for r in regions if r.text is not None]