mirror of
https://github.com/qurator-spk/eynollah.git
synced 2025-07-01 06:59:54 +02:00
exit early if no text regions found (to avoid segfault)
This commit is contained in:
parent
21efea8711
commit
25e967397d
1 changed files with 18 additions and 2 deletions
|
@ -5019,6 +5019,20 @@ class Eynollah:
|
|||
contours_only_text_parent_d = []
|
||||
contours_only_text_parent = []
|
||||
|
||||
if not len(contours_only_text_parent):
|
||||
# stop early
|
||||
empty_marginals = [[]] * len(polygons_of_marginals)
|
||||
if self.full_layout:
|
||||
pcgts = self.writer.build_pagexml_full_layout([], [], page_coord, [], [], [], [], [], [], polygons_of_images, contours_tables, [], polygons_of_marginals, empty_marginals, empty_marginals, [], [], [], cont_page, polygons_lines_xml, [])
|
||||
else:
|
||||
pcgts = self.writer.build_pagexml_no_full_layout([], page_coord, [], [], [], [], polygons_of_images, polygons_of_marginals, empty_marginals, empty_marginals, [], [], cont_page, polygons_lines_xml, contours_tables, [])
|
||||
self.logger.info("Job done in %.1fs", time.time() - t0)
|
||||
if self.dir_in:
|
||||
self.writer.write_pagexml(pcgts)
|
||||
continue
|
||||
else:
|
||||
return pcgts
|
||||
|
||||
#print("text region early 3 in %.1fs", time.time() - t0)
|
||||
if self.light_version:
|
||||
contours_only_text_parent = self.dilate_textregions_contours(contours_only_text_parent)
|
||||
|
@ -5164,10 +5178,12 @@ class Eynollah:
|
|||
all_found_textline_polygons_marginals, all_box_coord_marginals, slopes, slopes_h, slopes_marginals,
|
||||
cont_page, polygons_lines_xml, ocr_all_textlines)
|
||||
self.logger.info("Job done in %.1fs", time.time() - t0)
|
||||
if not self.dir_in:
|
||||
if self.dir_in:
|
||||
self.writer.write_pagexml(pcgts)
|
||||
continue
|
||||
else:
|
||||
return pcgts
|
||||
|
||||
|
||||
else:
|
||||
contours_only_text_parent_h = None
|
||||
if self.reading_order_machine_based:
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue