mirror of
				https://github.com/qurator-spk/sbb_pixelwise_segmentation.git
				synced 2025-10-24 23:14:20 +02:00 
			
		
		
		
	adding rest_as_paragraph and rest_as_graphic to elements
This commit is contained in:
		
							parent
							
								
									4e4490d740
								
							
						
					
					
						commit
						5aa6ee0010
					
				
					 2 changed files with 170 additions and 294 deletions
				
			
		|  | @ -1,9 +1,9 @@ | |||
| { | ||||
| "use_case": "layout", | ||||
| "textregions":{"paragraph":1, "heading": 2, "header":2,"drop-capital": 3, "marginalia":4 ,"page-number":1 , "catch-word":1 ,"footnote": 1, "footnote-continued": 1}, | ||||
| "imageregion":5, | ||||
| "separatorregion":6, | ||||
| "graphicregions" :{"handwritten-annotation":5, "decoration": 5, "signature": 5, "stamp": 5}, | ||||
| "artificial_class_on_boundry": ["paragraph","header", "heading", "marginalia", "page-number", "catch-word", "drop-capital","footnote", "footnote-continued"], | ||||
| "textregions":{ "rest_as_paragraph": 1, "header":2 , "heading":2 , "marginalia":3 }, | ||||
| "imageregion":4, | ||||
| "separatorregion":5, | ||||
| "graphicregions" :{"rest_as_decoration":6}, | ||||
| "artificial_class_on_boundry": ["paragraph"], | ||||
| "artificial_class_label":7 | ||||
| } | ||||
|  |  | |||
							
								
								
									
										454
									
								
								gt_gen_utils.py
									
										
									
									
									
								
							
							
						
						
									
										454
									
								
								gt_gen_utils.py
									
										
									
									
									
								
							|  | @ -180,7 +180,7 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                                     pass | ||||
| 
 | ||||
|                             if vv.tag == link + 'Point': | ||||
|                                 c_t_in.append([int(np.float(vv.attrib['x'])), int(np.float(vv.attrib['y']))]) | ||||
|                                 c_t_in.append([int(float(vv.attrib['x'])), int(float(vv.attrib['y']))]) | ||||
|                                 sumi += 1 | ||||
|                             elif vv.tag != link + 'Point' and sumi >= 1: | ||||
|                                 break | ||||
|  | @ -226,7 +226,6 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                 types_text_dict = config_params['textregions'] | ||||
|                 types_text = list(types_text_dict.keys()) | ||||
|                 types_text_label = list(types_text_dict.values()) | ||||
|                 print(types_text) | ||||
|             if 'graphicregions' in keys: | ||||
|                 types_graphic_dict = config_params['graphicregions'] | ||||
|                 types_graphic = list(types_graphic_dict.keys()) | ||||
|  | @ -235,41 +234,20 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                  | ||||
|             labels_rgb_color = [ (0,0,0), (255,0,0), (255,125,0), (255,0,125), (125,255,125), (125,125,0), (0,125,255), (0,125,0), (125,125,125), (255,0,255), (125,0,125), (0,255,0),(0,0,255), (0,255,255), (255,125,125),  (0,125,125), (0,255,125), (255,125,255), (125,255,0)] | ||||
|              | ||||
|              | ||||
|             region_tags=np.unique([x for x in alltags if x.endswith('Region')])    | ||||
| 
 | ||||
|             co_text_paragraph=[] | ||||
|             co_text_footnote=[] | ||||
|             co_text_footnote_con=[] | ||||
|             co_text_drop=[] | ||||
|             co_text_heading=[] | ||||
|             co_text_header=[] | ||||
|             co_text_marginalia=[] | ||||
|             co_text_catch=[] | ||||
|             co_text_page_number=[] | ||||
|             co_text_signature_mark=[] | ||||
|             co_text = {'drop-capital':[], "footnote":[], "footnote-continued":[], "heading":[], "signature-mark":[], "header":[], "catch-word":[], "page-number":[], "marginalia":[], "paragraph":[]} | ||||
|             co_graphic = {"handwritten-annotation":[], "decoration":[], "stamp":[], "signature":[]} | ||||
|             co_sep=[] | ||||
|             co_img=[] | ||||
|             co_table=[] | ||||
|             co_graphic_signature=[] | ||||
|             co_graphic_text_annotation=[] | ||||
|             co_graphic_decoration=[] | ||||
|             co_graphic_stamp=[] | ||||
|             co_noise=[] | ||||
|              | ||||
|             for tag in region_tags: | ||||
|                 if 'textregions' in keys: | ||||
|                     if tag.endswith('}TextRegion') or tag.endswith('}Textregion'): | ||||
|                         for nn in root1.iter(tag): | ||||
|                             c_t_in_drop=[] | ||||
|                             c_t_in_paragraph=[] | ||||
|                             c_t_in_heading=[] | ||||
|                             c_t_in_header=[] | ||||
|                             c_t_in_page_number=[] | ||||
|                             c_t_in_signature_mark=[] | ||||
|                             c_t_in_catch=[] | ||||
|                             c_t_in_marginalia=[] | ||||
|                             c_t_in_footnote=[] | ||||
|                             c_t_in_footnote_con=[] | ||||
|                             c_t_in = {'drop-capital':[], "footnote":[], "footnote-continued":[], "heading":[], "signature-mark":[], "header":[], "catch-word":[], "page-number":[], "marginalia":[], "paragraph":[]} | ||||
|                             sumi=0 | ||||
|                             for vv in nn.iter(): | ||||
|                                 # check the format of coords | ||||
|  | @ -277,143 +255,63 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                  | ||||
|                                     coords=bool(vv.attrib) | ||||
|                                     if coords: | ||||
|                                         #print('birda1') | ||||
|                                         p_h=vv.attrib['points'].split(' ') | ||||
|                                          | ||||
|                                         if "drop-capital" in types_text: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='drop-capital': | ||||
|                                                 c_t_in_drop.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                                  | ||||
|                                         if "footnote" in types_text: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='footnote': | ||||
|                                                 c_t_in_footnote.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                                  | ||||
|                                         if "footnote-continued" in types_text: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='footnote-continued': | ||||
|                                                 c_t_in_footnote_con.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                          | ||||
|                                         if "heading" in types_text: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='heading': | ||||
|                                                 c_t_in_heading.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                      | ||||
|                                         if "signature-mark" in types_text: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='signature-mark': | ||||
|                                                 c_t_in_signature_mark.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
| 
 | ||||
|                                         if "header" in types_text: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='header': | ||||
|                                                 c_t_in_header.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                          | ||||
|                                         if "catch-word" in types_text: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='catch-word': | ||||
|                                                 c_t_in_catch.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                      | ||||
|                                         if "page-number" in types_text: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='page-number': | ||||
|                                                 c_t_in_page_number.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
| 
 | ||||
|                                         if "marginalia" in types_text:     | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='marginalia': | ||||
|                                                 c_t_in_marginalia.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                              | ||||
|                                         if "paragraph" in types_text: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='paragraph': | ||||
|                                                 c_t_in_paragraph.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
| 
 | ||||
|                                         if "rest_as_paragraph" in types_text: | ||||
|                                             types_text_without_paragraph = [element for element in types_text if element!='rest_as_paragraph' and element!='paragraph'] | ||||
|                                             if len(types_text_without_paragraph) == 0: | ||||
|                                                 if "type" in nn.attrib: | ||||
|                                                     c_t_in['paragraph'].append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                             elif len(types_text_without_paragraph) >= 1: | ||||
|                                                 if "type" in nn.attrib: | ||||
|                                                     if nn.attrib['type'] in types_text_without_paragraph: | ||||
|                                                         c_t_in[nn.attrib['type']].append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                                     else: | ||||
|                                                         c_t_in['paragraph'].append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                                          | ||||
|                                         else: | ||||
|                                             if "type" in nn.attrib: | ||||
|                                                 c_t_in[nn.attrib['type']].append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                  | ||||
|                                         break | ||||
|                                     else: | ||||
|                                         pass | ||||
|                  | ||||
|                  | ||||
|                                  | ||||
|                                 if vv.tag==link+'Point': | ||||
|                                     if "drop-capital" in types_text: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='drop-capital': | ||||
|                                             c_t_in_drop.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                     if "rest_as_paragraph" in types_text: | ||||
|                                         types_text_without_paragraph = [element for element in types_text if element!='rest_as_paragraph' and element!='paragraph'] | ||||
|                                         if len(types_text_without_paragraph) == 0: | ||||
|                                             if "type" in nn.attrib: | ||||
|                                                 c_t_in['paragraph'].append( [ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ] ) | ||||
|                                                 sumi+=1 | ||||
|                                         elif len(types_text_without_paragraph) >= 1: | ||||
|                                             if "type" in nn.attrib: | ||||
|                                                 if nn.attrib['type'] in types_text_without_paragraph: | ||||
|                                                     c_t_in[nn.attrib['type']].append( [ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ] ) | ||||
|                                                     sumi+=1 | ||||
|                                                 else: | ||||
|                                                     c_t_in['paragraph'].append( [ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ] ) | ||||
|                                                     sumi+=1 | ||||
|                                                      | ||||
|                                     else: | ||||
|                                         if "type" in nn.attrib: | ||||
|                                             c_t_in[nn.attrib['type']].append( [ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ] ) | ||||
|                                             sumi+=1 | ||||
|                                              | ||||
|                                     if "footnote" in types_text: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='footnote': | ||||
|                                             c_t_in_footnote.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                          | ||||
|                                     if "footnote-continued" in types_text: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='footnote-continued': | ||||
|                                             c_t_in_footnote_con.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                              | ||||
|                                     if "heading" in types_text: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='heading': | ||||
|                                             c_t_in_heading.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                              | ||||
|                                     if "signature-mark" in types_text: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='signature-mark': | ||||
|                                             c_t_in_signature_mark.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                          | ||||
|                                     if "header" in types_text: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='header': | ||||
|                                             c_t_in_header.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                      | ||||
|                                     if "catch-word" in types_text: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='catch-word': | ||||
|                                             c_t_in_catch.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                              | ||||
|                                     if "page-number" in types_text: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='page-number': | ||||
|                                             c_t_in_page_number.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                      | ||||
|                                     if "marginalia" in types_text: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='marginalia': | ||||
|                                             c_t_in_marginalia.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                          | ||||
|                                     if "paragraph" in types_text: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='paragraph': | ||||
|                                             c_t_in_paragraph.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                          | ||||
| 
 | ||||
| 
 | ||||
|                                 elif vv.tag!=link+'Point' and sumi>=1: | ||||
|                                     break | ||||
|                  | ||||
|                             if len(c_t_in_drop)>0: | ||||
|                                 co_text_drop.append(np.array(c_t_in_drop)) | ||||
|                             if len(c_t_in_footnote_con)>0: | ||||
|                                 co_text_footnote_con.append(np.array(c_t_in_footnote_con)) | ||||
|                             if len(c_t_in_footnote)>0: | ||||
|                                 co_text_footnote.append(np.array(c_t_in_footnote)) | ||||
|                             if len(c_t_in_paragraph)>0: | ||||
|                                 co_text_paragraph.append(np.array(c_t_in_paragraph)) | ||||
|                             if len(c_t_in_heading)>0: | ||||
|                                 co_text_heading.append(np.array(c_t_in_heading)) | ||||
|                                  | ||||
|                             if len(c_t_in_header)>0: | ||||
|                                 co_text_header.append(np.array(c_t_in_header)) | ||||
|                             if len(c_t_in_page_number)>0: | ||||
|                                 co_text_page_number.append(np.array(c_t_in_page_number)) | ||||
|                             if len(c_t_in_catch)>0: | ||||
|                                 co_text_catch.append(np.array(c_t_in_catch)) | ||||
|                                  | ||||
|                             if len(c_t_in_signature_mark)>0: | ||||
|                                 co_text_signature_mark.append(np.array(c_t_in_signature_mark)) | ||||
|                                  | ||||
|                             if len(c_t_in_marginalia)>0: | ||||
|                                 co_text_marginalia.append(np.array(c_t_in_marginalia)) | ||||
|                                  | ||||
|                  | ||||
|                             for element_text in list(c_t_in.keys()): | ||||
|                                 if len(c_t_in[element_text])>0: | ||||
|                                     co_text[element_text].append(np.array(c_t_in[element_text])) | ||||
|                                      | ||||
|                 if 'graphicregions' in keys: | ||||
|                     if tag.endswith('}GraphicRegion') or tag.endswith('}graphicregion'): | ||||
|                         #print('sth') | ||||
|                         for nn in root1.iter(tag): | ||||
|                             c_t_in_stamp=[] | ||||
|                             c_t_in_text_annotation=[] | ||||
|                             c_t_in_decoration=[] | ||||
|                             c_t_in_signature=[] | ||||
|                             c_t_in_graphic = {"handwritten-annotation":[], "decoration":[], "stamp":[], "signature":[]} | ||||
|                             sumi=0 | ||||
|                             for vv in nn.iter(): | ||||
|                                 # check the format of coords | ||||
|  | @ -421,23 +319,22 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                                     coords=bool(vv.attrib) | ||||
|                                     if coords: | ||||
|                                         p_h=vv.attrib['points'].split(' ') | ||||
|                                         if "handwritten-annotation" in types_graphic: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='handwritten-annotation': | ||||
|                                                 c_t_in_text_annotation.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                          | ||||
|                                         if "decoration" in types_graphic: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='decoration': | ||||
|                                                 c_t_in_decoration.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
| 
 | ||||
|                                         if "stamp" in types_graphic: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='stamp': | ||||
|                                                 c_t_in_stamp.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                              | ||||
|                                         if "signature" in types_graphic: | ||||
|                                             if "type" in nn.attrib and nn.attrib['type']=='signature': | ||||
|                                                 c_t_in_signature.append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                      | ||||
|                                          | ||||
|                                         if "rest_as_decoration" in types_graphic: | ||||
|                                             types_graphic_without_decoration = [element for element in types_graphic if element!='rest_as_decoration' and element!='decoration'] | ||||
|                                             if len(types_graphic_without_decoration) == 0: | ||||
|                                                 if "type" in nn.attrib: | ||||
|                                                     c_t_in_graphic['decoration'].append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                             elif len(types_graphic_without_decoration) >= 1: | ||||
|                                                 if "type" in nn.attrib: | ||||
|                                                     if nn.attrib['type'] in types_graphic_without_decoration: | ||||
|                                                         c_t_in_graphic[nn.attrib['type']].append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                                     else: | ||||
|                                                         c_t_in_graphic['decoration'].append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) ) | ||||
|                                                          | ||||
|                                         else: | ||||
|                                             if "type" in nn.attrib: | ||||
|                                                 c_t_in_graphic[nn.attrib['type']].append( np.array( [ [ int(x.split(',')[0]) , int(x.split(',')[1]) ]  for x in p_h] ) )         | ||||
|                                          | ||||
|                                         break | ||||
|                                     else: | ||||
|  | @ -445,34 +342,33 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                  | ||||
|                  | ||||
|                                 if vv.tag==link+'Point': | ||||
|                                     if "handwritten-annotation" in types_graphic: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='handwritten-annotation': | ||||
|                                             c_t_in_text_annotation.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                     if "rest_as_decoration" in types_graphic: | ||||
|                                         types_graphic_without_decoration = [element for element in types_graphic if element!='rest_as_decoration' and element!='decoration'] | ||||
|                                         if len(types_graphic_without_decoration) == 0: | ||||
|                                             if "type" in nn.attrib: | ||||
|                                                 c_t_in_graphic['decoration'].append( [ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ] ) | ||||
|                                                 sumi+=1 | ||||
|                                         elif len(types_graphic_without_decoration) >= 1: | ||||
|                                             if "type" in nn.attrib: | ||||
|                                                 if nn.attrib['type'] in types_graphic_without_decoration: | ||||
|                                                     c_t_in_graphic[nn.attrib['type']].append( [ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ] ) | ||||
|                                                     sumi+=1 | ||||
|                                                 else: | ||||
|                                                     c_t_in_graphic['decoration'].append( [ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ] ) | ||||
|                                                     sumi+=1 | ||||
|                                                      | ||||
|                                     else: | ||||
|                                         if "type" in nn.attrib: | ||||
|                                             c_t_in_graphic[nn.attrib['type']].append( [ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ] )  | ||||
|                                             sumi+=1 | ||||
|                                              | ||||
|                                     if "decoration" in types_graphic:         | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='decoration': | ||||
|                                             c_t_in_decoration.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                          | ||||
|                                     if "stamp" in types_graphic: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='stamp': | ||||
|                                             c_t_in_stamp.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                          | ||||
|                                     if "signature" in types_graphic: | ||||
|                                         if "type" in nn.attrib and nn.attrib['type']=='signature': | ||||
|                                             c_t_in_signature.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                             sumi+=1 | ||||
|                                 elif vv.tag!=link+'Point' and sumi>=1: | ||||
|                                     break | ||||
|                                  | ||||
|                             for element_graphic in list(c_t_in_graphic.keys()): | ||||
|                                 if len(c_t_in_graphic[element_graphic])>0: | ||||
|                                     co_graphic[element_graphic].append(np.array(c_t_in_graphic[element_graphic])) | ||||
|                                      | ||||
|                             if len(c_t_in_text_annotation)>0: | ||||
|                                 co_graphic_text_annotation.append(np.array(c_t_in_text_annotation)) | ||||
|                             if len(c_t_in_decoration)>0: | ||||
|                                 co_graphic_decoration.append(np.array(c_t_in_decoration)) | ||||
|                             if len(c_t_in_stamp)>0: | ||||
|                                 co_graphic_stamp.append(np.array(c_t_in_stamp)) | ||||
|                             if len(c_t_in_signature)>0: | ||||
|                                 co_graphic_signature.append(np.array(c_t_in_signature)) | ||||
|              | ||||
|                 if 'imageregion' in keys: | ||||
|                     if tag.endswith('}ImageRegion') or tag.endswith('}imageregion'): | ||||
|  | @ -491,7 +387,7 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                  | ||||
|                  | ||||
|                                 if vv.tag==link+'Point': | ||||
|                                     c_t_in.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                     c_t_in.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                                     sumi+=1 | ||||
| 
 | ||||
|                                 elif vv.tag!=link+'Point' and sumi>=1: | ||||
|  | @ -517,7 +413,7 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                  | ||||
|                  | ||||
|                                 if vv.tag==link+'Point': | ||||
|                                     c_t_in.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                     c_t_in.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                                     sumi+=1 | ||||
| 
 | ||||
|                                 elif vv.tag!=link+'Point' and sumi>=1: | ||||
|  | @ -545,7 +441,7 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                  | ||||
|                  | ||||
|                                 if vv.tag==link+'Point': | ||||
|                                     c_t_in.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                     c_t_in.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                                     sumi+=1 | ||||
|                                 #print(vv.tag,'in') | ||||
|                                 elif vv.tag!=link+'Point' and sumi>=1: | ||||
|  | @ -571,7 +467,7 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                  | ||||
|                  | ||||
|                                 if vv.tag==link+'Point': | ||||
|                                     c_t_in.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                                     c_t_in.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                                     sumi+=1 | ||||
|                                 #print(vv.tag,'in') | ||||
|                                 elif vv.tag!=link+'Point' and sumi>=1: | ||||
|  | @ -583,59 +479,63 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                 if "paragraph" in elements_with_artificial_class: | ||||
|                     erosion_rate = 2 | ||||
|                     dilation_rate = 4 | ||||
|                     co_text_paragraph, img_boundary = update_region_contours(co_text_paragraph, img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                     co_text['paragraph'], img_boundary = update_region_contours(co_text['paragraph'], img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                 if "drop-capital" in elements_with_artificial_class: | ||||
|                     erosion_rate = 0 | ||||
|                     dilation_rate = 4 | ||||
|                     co_text_drop, img_boundary = update_region_contours(co_text_drop, img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                     co_text["drop-capital"], img_boundary = update_region_contours(co_text["drop-capital"], img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                 if "catch-word" in elements_with_artificial_class: | ||||
|                     erosion_rate = 0 | ||||
|                     dilation_rate = 4 | ||||
|                     co_text_catch, img_boundary = update_region_contours(co_text_catch, img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                     co_text["catch-word"], img_boundary = update_region_contours(co_text["catch-word"], img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                 if "page-number" in elements_with_artificial_class: | ||||
|                     erosion_rate = 0 | ||||
|                     dilation_rate = 4 | ||||
|                     co_text_page_number, img_boundary = update_region_contours(co_text_page_number, img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                     co_text["page-number"], img_boundary = update_region_contours(co_text["page-number"], img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                 if "header" in elements_with_artificial_class: | ||||
|                     erosion_rate = 1 | ||||
|                     dilation_rate = 4 | ||||
|                     co_text_header, img_boundary = update_region_contours(co_text_header, img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                     co_text["header"], img_boundary = update_region_contours(co_text["header"], img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                 if "heading" in elements_with_artificial_class: | ||||
|                     erosion_rate = 1 | ||||
|                     dilation_rate = 4 | ||||
|                     co_text_heading, img_boundary = update_region_contours(co_text_heading, img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                     co_text["heading"], img_boundary = update_region_contours(co_text["heading"], img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                 if "signature-mark" in elements_with_artificial_class: | ||||
|                     erosion_rate = 1 | ||||
|                     dilation_rate = 4 | ||||
|                     co_text_signature_mark, img_boundary = update_region_contours(co_text_signature_mark, img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                     co_text["signature-mark"], img_boundary = update_region_contours(co_text["signature-mark"], img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                 if "marginalia" in elements_with_artificial_class: | ||||
|                     erosion_rate = 2 | ||||
|                     dilation_rate = 4 | ||||
|                     co_text_marginalia, img_boundary = update_region_contours(co_text_marginalia, img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                     co_text["marginalia"], img_boundary = update_region_contours(co_text["marginalia"], img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                 if "footnote" in elements_with_artificial_class: | ||||
|                     erosion_rate = 2 | ||||
|                     dilation_rate = 4 | ||||
|                     co_text_footnote, img_boundary = update_region_contours(co_text_footnote, img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                     co_text["footnote"], img_boundary = update_region_contours(co_text["footnote"], img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                 if "footnote-continued" in elements_with_artificial_class: | ||||
|                     erosion_rate = 2 | ||||
|                     dilation_rate = 4 | ||||
|                     co_text_footnote_con, img_boundary = update_region_contours(co_text_footnote_con, img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                     co_text["footnote-continued"], img_boundary = update_region_contours(co_text["footnote-continued"], img_boundary, erosion_rate, dilation_rate, y_len, x_len ) | ||||
|                      | ||||
|                      | ||||
|                  | ||||
|             img = np.zeros( (y_len,x_len,3) )  | ||||
| 
 | ||||
|             if output_type == '3d': | ||||
|                  | ||||
|                 if 'graphicregions' in keys: | ||||
|                     if "handwritten-annotation" in types_graphic: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_graphic_text_annotation, color=labels_rgb_color[ config_params['graphicregions']['handwritten-annotation']]) | ||||
|                     if "signature" in types_graphic: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_graphic_signature, color=labels_rgb_color[ config_params['graphicregions']['signature']]) | ||||
|                     if "decoration" in types_graphic: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_graphic_decoration, color=labels_rgb_color[ config_params['graphicregions']['decoration']]) | ||||
|                     if "stamp" in types_graphic: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_graphic_stamp, color=labels_rgb_color[ config_params['graphicregions']['stamp']]) | ||||
|                     if 'rest_as_decoration' in types_graphic: | ||||
|                         types_graphic[types_graphic=='rest_as_decoration'] = 'decoration' | ||||
|                         for element_graphic in types_graphic: | ||||
|                             if element_graphic == 'decoration': | ||||
|                                 color_label = labels_rgb_color[ config_params['graphicregions']['rest_as_decoration']] | ||||
|                             else: | ||||
|                                 color_label = labels_rgb_color[ config_params['graphicregions'][element_graphic]] | ||||
|                             img_poly=cv2.fillPoly(img, pts =co_graphic[element_graphic], color=color_label) | ||||
|                     else: | ||||
|                         for element_graphic in types_graphic: | ||||
|                             color_label = labels_rgb_color[ config_params['graphicregions'][element_graphic]] | ||||
|                             img_poly=cv2.fillPoly(img, pts =co_graphic[element_graphic], color=color_label) | ||||
|                      | ||||
|                          | ||||
|                 if 'imageregion' in keys:  | ||||
|                     img_poly=cv2.fillPoly(img, pts =co_img, color=labels_rgb_color[ config_params['imageregion']]) | ||||
|  | @ -647,26 +547,19 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                     img_poly=cv2.fillPoly(img, pts =co_noise, color=labels_rgb_color[ config_params['noiseregion']]) | ||||
|                      | ||||
|                 if 'textregions' in keys: | ||||
|                     if "paragraph" in types_text: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_paragraph, color=labels_rgb_color[ config_params['textregions']['paragraph']]) | ||||
|                     if "footnote" in types_text: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_footnote, color=labels_rgb_color[ config_params['textregions']['footnote']]) | ||||
|                     if "footnote-continued" in types_text: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_footnote_con, color=labels_rgb_color[ config_params['textregions']['footnote-continued']]) | ||||
|                     if "heading" in types_text: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_heading, color=labels_rgb_color[ config_params['textregions']['heading']]) | ||||
|                     if "header" in types_text: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_header, color=labels_rgb_color[ config_params['textregions']['header']]) | ||||
|                     if "catch-word" in types_text: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_catch, color=labels_rgb_color[ config_params['textregions']['catch-word']]) | ||||
|                     if "signature-mark" in types_text: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_signature_mark, color=labels_rgb_color[ config_params['textregions']['signature-mark']]) | ||||
|                     if "page-number" in types_text: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_page_number, color=labels_rgb_color[ config_params['textregions']['page-number']]) | ||||
|                     if "marginalia" in types_text: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_marginalia, color=labels_rgb_color[ config_params['textregions']['marginalia']]) | ||||
|                     if "drop-capital" in types_text: | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_drop, color=labels_rgb_color[ config_params['textregions']['drop-capital']]) | ||||
|                     if 'rest_as_paragraph' in types_text: | ||||
|                         types_text[types_text=='rest_as_paragraph'] = 'paragraph' | ||||
|                         for element_text in types_text: | ||||
|                             if element_text == 'paragraph': | ||||
|                                 color_label = labels_rgb_color[ config_params['textregions']['rest_as_paragraph']] | ||||
|                             else: | ||||
|                                 color_label = labels_rgb_color[ config_params['textregions'][element_text]] | ||||
|                             img_poly=cv2.fillPoly(img, pts =co_text[element_text], color=color_label) | ||||
|                     else: | ||||
|                         for element_text in types_text: | ||||
|                             color_label = labels_rgb_color[ config_params['textregions'][element_text]] | ||||
|                             img_poly=cv2.fillPoly(img, pts =co_text[element_text], color=color_label) | ||||
|                          | ||||
|                          | ||||
|                 if "artificial_class_on_boundry" in keys: | ||||
|                     img_poly[:,:,0][img_boundary[:,:]==1] = artificial_class_rgb_color[0] | ||||
|  | @ -678,18 +571,19 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                  | ||||
|             elif output_type == '2d': | ||||
|                 if 'graphicregions' in keys: | ||||
|                     if "handwritten-annotation" in types_graphic: | ||||
|                         color_label = config_params['graphicregions']['handwritten-annotation'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_graphic_text_annotation, color=(color_label,color_label,color_label)) | ||||
|                     if "signature" in types_graphic: | ||||
|                         color_label = config_params['graphicregions']['signature'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_graphic_signature, color=(color_label,color_label,color_label)) | ||||
|                     if "decoration" in types_graphic: | ||||
|                         color_label = config_params['graphicregions']['decoration'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_graphic_decoration, color=(color_label,color_label,color_label)) | ||||
|                     if "stamp" in types_graphic: | ||||
|                         color_label = config_params['graphicregions']['stamp'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_graphic_stamp, color=(color_label,color_label,color_label)) | ||||
|                     if 'rest_as_decoration' in types_graphic: | ||||
|                         types_graphic[types_graphic=='rest_as_decoration'] = 'decoration' | ||||
|                         for element_graphic in types_graphic: | ||||
|                             if element_graphic == 'decoration': | ||||
|                                 color_label = config_params['graphicregions']['rest_as_decoration'] | ||||
|                             else: | ||||
|                                 color_label = config_params['graphicregions'][element_graphic] | ||||
|                             img_poly=cv2.fillPoly(img, pts =co_graphic[element_graphic], color=color_label) | ||||
|                     else: | ||||
|                         for element_graphic in types_graphic: | ||||
|                             color_label = config_params['graphicregions'][element_graphic] | ||||
|                             img_poly=cv2.fillPoly(img, pts =co_graphic[element_graphic], color=color_label) | ||||
|                              | ||||
|                  | ||||
|                 if 'imageregion' in keys: | ||||
|                     color_label = config_params['imageregion'] | ||||
|  | @ -705,36 +599,18 @@ def get_images_of_ground_truth(gt_list, dir_in, output_dir, output_type, config_ | |||
|                     img_poly=cv2.fillPoly(img, pts =co_noise, color=(color_label,color_label,color_label)) | ||||
|                      | ||||
|                 if 'textregions' in keys: | ||||
|                     if "paragraph" in types_text: | ||||
|                         color_label = config_params['textregions']['paragraph'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_paragraph, color=(color_label,color_label,color_label)) | ||||
|                     if "footnote" in types_text: | ||||
|                         color_label = config_params['textregions']['footnote'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_footnote, color=(color_label,color_label,color_label)) | ||||
|                     if "footnote-continued" in types_text: | ||||
|                         color_label = config_params['textregions']['footnote-continued'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_footnote_con, color=(color_label,color_label,color_label)) | ||||
|                     if "heading" in types_text: | ||||
|                         color_label = config_params['textregions']['heading'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_heading, color=(color_label,color_label,color_label)) | ||||
|                     if "header" in types_text: | ||||
|                         color_label = config_params['textregions']['header'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_header, color=(color_label,color_label,color_label)) | ||||
|                     if "catch-word" in types_text: | ||||
|                         color_label = config_params['textregions']['catch-word'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_catch, color=(color_label,color_label,color_label)) | ||||
|                     if "signature-mark" in types_text: | ||||
|                         color_label = config_params['textregions']['signature-mark'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_signature_mark, color=(color_label,color_label,color_label)) | ||||
|                     if "page-number" in types_text: | ||||
|                         color_label = config_params['textregions']['page-number'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_page_number, color=(color_label,color_label,color_label)) | ||||
|                     if "marginalia" in types_text: | ||||
|                         color_label = config_params['textregions']['marginalia'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_marginalia, color=(color_label,color_label,color_label)) | ||||
|                     if "drop-capital" in types_text: | ||||
|                         color_label = config_params['textregions']['drop-capital'] | ||||
|                         img_poly=cv2.fillPoly(img, pts =co_text_drop, color=(color_label,color_label,color_label)) | ||||
|                     if 'rest_as_paragraph' in types_text: | ||||
|                         types_text[types_text=='rest_as_paragraph'] = 'paragraph' | ||||
|                         for element_text in types_text: | ||||
|                             if element_text == 'paragraph': | ||||
|                                 color_label = config_params['textregions']['rest_as_paragraph'] | ||||
|                             else: | ||||
|                                 color_label = config_params['textregions'][element_text] | ||||
|                             img_poly=cv2.fillPoly(img, pts =co_text[element_text], color=color_label) | ||||
|                     else: | ||||
|                         for element_text in types_text: | ||||
|                             color_label = config_params['textregions'][element_text] | ||||
|                             img_poly=cv2.fillPoly(img, pts =co_text[element_text], color=color_label) | ||||
|                          | ||||
|                 if "artificial_class_on_boundry" in keys: | ||||
|                     img_poly[:,:][img_boundary[:,:]==1] = artificial_class_label | ||||
|  | @ -947,51 +823,51 @@ def read_xml(xml_file): | |||
|                         if "type" in nn.attrib and nn.attrib['type']=='drop-capital': | ||||
|                         #if nn.attrib['type']=='paragraph': | ||||
| 
 | ||||
|                             c_t_in_drop.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                             c_t_in_drop.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                             sumi+=1 | ||||
| 
 | ||||
|                         elif "type" in nn.attrib and nn.attrib['type']=='heading': | ||||
|                             id_heading.append(nn.attrib['id']) | ||||
|                             c_t_in_heading.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                             c_t_in_heading.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                             sumi+=1 | ||||
| 
 | ||||
| 
 | ||||
|                         elif "type" in nn.attrib and nn.attrib['type']=='signature-mark': | ||||
| 
 | ||||
|                             c_t_in_signature_mark.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                             c_t_in_signature_mark.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                             #print(c_t_in_paragraph) | ||||
|                             sumi+=1 | ||||
|                         elif "type" in nn.attrib and nn.attrib['type']=='header': | ||||
|                             id_header.append(nn.attrib['id']) | ||||
|                             c_t_in_header.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                             c_t_in_header.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                             sumi+=1 | ||||
| 
 | ||||
| 
 | ||||
|                         elif "type" in nn.attrib and nn.attrib['type']=='catch-word': | ||||
|                             c_t_in_catch.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                             c_t_in_catch.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                             sumi+=1 | ||||
| 
 | ||||
| 
 | ||||
|                         elif "type" in nn.attrib and nn.attrib['type']=='page-number': | ||||
| 
 | ||||
|                             c_t_in_page_number.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                             c_t_in_page_number.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                             #print(c_t_in_paragraph) | ||||
|                             sumi+=1 | ||||
| 
 | ||||
|                         elif "type" in nn.attrib and nn.attrib['type']=='marginalia': | ||||
|                             id_marginalia.append(nn.attrib['id']) | ||||
| 
 | ||||
|                             c_t_in_marginalia.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                             c_t_in_marginalia.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                             #print(c_t_in_paragraph) | ||||
|                             sumi+=1 | ||||
| 
 | ||||
|                         else: | ||||
|                             id_paragraph.append(nn.attrib['id']) | ||||
|                             c_t_in_paragraph.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                             c_t_in_paragraph.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                             #print(c_t_in_paragraph) | ||||
|                             sumi+=1 | ||||
| 
 | ||||
|                         #c_t_in.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                         #c_t_in.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
| 
 | ||||
|                     #print(vv.tag,'in') | ||||
|                     elif vv.tag!=link+'Point' and sumi>=1: | ||||
|  | @ -1057,16 +933,16 @@ def read_xml(xml_file): | |||
|                         if "type" in nn.attrib and nn.attrib['type']=='handwritten-annotation': | ||||
|                         #if nn.attrib['type']=='paragraph': | ||||
| 
 | ||||
|                             c_t_in_text_annotation.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                             c_t_in_text_annotation.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                             sumi+=1 | ||||
| 
 | ||||
|                         elif "type" in nn.attrib and nn.attrib['type']=='decoration': | ||||
| 
 | ||||
|                             c_t_in_decoration.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                             c_t_in_decoration.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                             #print(c_t_in_paragraph) | ||||
|                             sumi+=1 | ||||
|                         else: | ||||
|                             c_t_in.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                             c_t_in.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                             sumi+=1 | ||||
| 
 | ||||
|                 if len(c_t_in_text_annotation)>0: | ||||
|  | @ -1096,7 +972,7 @@ def read_xml(xml_file): | |||
| 
 | ||||
| 
 | ||||
|                     if vv.tag==link+'Point': | ||||
|                         c_t_in.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                         c_t_in.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                         sumi+=1 | ||||
|                     #print(vv.tag,'in') | ||||
|                     elif vv.tag!=link+'Point' and sumi>=1: | ||||
|  | @ -1123,7 +999,7 @@ def read_xml(xml_file): | |||
| 
 | ||||
| 
 | ||||
|                     if vv.tag==link+'Point': | ||||
|                         c_t_in.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                         c_t_in.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                         sumi+=1 | ||||
|                     #print(vv.tag,'in') | ||||
|                     elif vv.tag!=link+'Point' and sumi>=1: | ||||
|  | @ -1150,7 +1026,7 @@ def read_xml(xml_file): | |||
| 
 | ||||
| 
 | ||||
|                     if vv.tag==link+'Point': | ||||
|                         c_t_in.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                         c_t_in.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                         sumi+=1 | ||||
|                     #print(vv.tag,'in') | ||||
|                     elif vv.tag!=link+'Point' and sumi>=1: | ||||
|  | @ -1176,7 +1052,7 @@ def read_xml(xml_file): | |||
| 
 | ||||
| 
 | ||||
|                     if vv.tag==link+'Point': | ||||
|                         c_t_in.append([ int(np.float(vv.attrib['x'])) , int(np.float(vv.attrib['y'])) ]) | ||||
|                         c_t_in.append([ int(float(vv.attrib['x'])) , int(float(vv.attrib['y'])) ]) | ||||
|                         sumi+=1 | ||||
|                     #print(vv.tag,'in') | ||||
|                     elif vv.tag!=link+'Point' and sumi>=1: | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue