37cc513ce9 
								
							 
						 
						
							
							
								
								🚧  sbb_textline_detector: Translate detected coordinates  
							
							
							
						 
						
							2020-10-15 19:26:24 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								a9b9c8a885 
								
							 
						 
						
							
							
								
								🚧  sbb_textline_detector: Get image via image_from_page  
							
							
							
						 
						
							2020-10-15 19:03:07 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Konstantin Baierer 
								
							 
						 
						
							
							
							
							
								
							
							
								f167f6768c 
								
							 
						 
						
							
							
								
								getLogger per method  
							
							
							
						 
						
							2020-09-24 10:53:45 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									vahidrezanezhad 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								0f09f4a1f6 
								
							 
						 
						
							
							
								
								Update main.py  
							
							... 
							
							
							
							Issues 30 and 40 are resolved 
							
						 
						
							2020-08-27 06:43:30 -04:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Clemens Neudecker 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								e4798c6811 
								
							 
						 
						
							
							
								
								replace 'PrintSpace' with 'Border'  
							
							
							
						 
						
							2020-08-18 17:05:20 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Clemens Neudecker 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								36adbe29d8 
								
							 
						 
						
							
							
								
								replace 'PrintSpace' with 'Border'  
							
							
							
						 
						
							2020-08-18 17:03:56 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Konstantin Baierer 
								
							 
						 
						
							
							
							
							
								
							
							
								05deb03ec8 
								
							 
						 
						
							
							
								
								use make_file_id and assert_file_grp_cardinality  
							
							
							
						 
						
							2020-08-11 15:06:34 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								8b01d9e671 
								
							 
						 
						
							
							
								
								🐛  sbb_textline_detection: Set pcGtsId  
							
							... 
							
							
							
							Newest OCR-D workspace validation requires that the pcGtsId of a
PAGE-XML file matches its METS mets:file/ID. Fix this by setting
it correctly. 
							
						 
						
							2020-08-05 17:16:40 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
								
								
							
							
							
								
							
							
								3593506e72 
								
							 
						 
						
							
							
								
								🔧  ocrd-tool.json: Update description, steps and categories  
							
							... 
							
							
							
							Fixes  #31 . 
						
							2020-05-29 17:30:53 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Lucas Sulzbach 
								
							 
						 
						
							
							
							
							
								
							
							
								ead1eae114 
								
							 
						 
						
							
							
								
								ocrd-tool.json: Make description OCR-D compliant  
							
							
							
						 
						
							2020-05-07 00:16:55 -03:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									vahidrezanezhad 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								f94944ee80 
								
							 
						 
						
							
							
								
								change scaling  
							
							
							
						 
						
							2020-04-11 02:52:41 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									b-vr103 
								
							 
						 
						
							
							
							
							
								
							
							
								b9caa8e12c 
								
							 
						 
						
							
							
								
								resolve 2020-02-17-bug-sbb_textline_detector  
							
							
							
						 
						
							2020-02-21 16:48:27 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									b-vr103 
								
							 
						 
						
							
							
							
							
								
							
							
								1446d7c662 
								
							 
						 
						
							
							
								
								getting robust and doing sth for verticals  
							
							
							
						 
						
							2019-12-13 18:04:04 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									b-vr103 
								
							 
						 
						
							
							
							
							
								
							
							
								3941f2f17d 
								
							 
						 
						
							
							
								
								gettin robust and doing sth for verticals  
							
							
							
						 
						
							2019-12-13 17:49:19 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								f90b3cfa86 
								
							 
						 
						
							
							
								
								🔊  sbb_textline_detector: In OCR-D interface, warn if overwriting existing segmentation  
							
							
							
						 
						
							2019-12-11 13:54:29 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								11c0e9cee5 
								
							 
						 
						
							
							
								
								🐛  sbb_textline_detector: Do not print PAGE output to stdout  
							
							... 
							
							
							
							ocrd-sbb-textline-detector uses ocrd_page's parse() to parse XML input,
which writes the XML to stdout by default.
Fix this by silencing it using parse()'s silence=True. 
							
						 
						
							2019-12-11 12:39:50 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									wrznr 
								
							 
						 
						
							
							
							
							
								
							
							
								4fc57d7756 
								
							 
						 
						
							
							
								
								Assign page id  
							
							
							
						 
						
							2019-12-10 16:59:45 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									wrznr 
								
							 
						 
						
							
							
							
							
								
							
							
								9e9163e852 
								
							 
						 
						
							
							
								
								Simplify the iteration over files in the input file group  
							
							
							
						 
						
							2019-12-10 16:55:43 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
								
								
							
							
							
								
							
							
								6e0decb5ec 
								
							 
						 
						
							
							
								
								Merge pull request  #12  from kba/rename-tool  
							
							... 
							
							
							
							Rename ocrd_sbb.. to ocrd-sbb... in ocrd_cli.py, ht @bertsky 
							
						 
						
							2019-12-09 16:50:27 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								5fb30a7a1f 
								
							 
						 
						
							
							
								
								Revert "Merge branch 'master' of  https://github.com/qurator-spk/sbb_textline_detector "  
							
							... 
							
							
							
							This reverts commit 417b9235d5a74974b7b6 
							
						 
						
							2019-12-09 15:11:25 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Konstantin Baierer 
								
							 
						 
						
							
							
							
							
								
							
							
								cf6381c148 
								
							 
						 
						
							
							
								
								Rename ocrd_sbb.. to ocrd-sbb... in ocrd_cli.py, ht @bertsky  
							
							
							
						 
						
							2019-12-09 13:02:44 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Clemens Neudecker 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								51e241fd84 
								
							 
						 
						
							
							
								
								Merge pull request  #5  from cneud/cneud-fix-typos  
							
							... 
							
							
							
							Fix typos 
							
						 
						
							2019-12-06 19:45:14 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Clemens Neudecker 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								12c07f389d 
								
							 
						 
						
							
							
								
								Merge pull request  #7  from cneud/cneud-fix-docstring  
							
							... 
							
							
							
							fix docstring 
							
						 
						
							2019-12-06 19:44:34 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Clemens Neudecker 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								29870f26e1 
								
							 
						 
						
							
							
								
								Merge pull request  #4  from cneud/cneud-PAGE2019  
							
							... 
							
							
							
							PAGE2019 
							
						 
						
							2019-12-06 19:44:04 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Konstantin Baierer 
								
							 
						 
						
							
							
							
							
								
							
							
								b6ca1a7c53 
								
							 
						 
						
							
							
								
								kebab-case snake_case executable,  fix   #9  
							
							
							
						 
						
							2019-12-06 18:26:09 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Clemens Neudecker 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								6c0bfba686 
								
							 
						 
						
							
							
								
								fix typos  
							
							
							
						 
						
							2019-12-06 02:21:04 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Clemens Neudecker 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								c8bc468628 
								
							 
						 
						
							
							
								
								fix docstring  
							
							
							
						 
						
							2019-12-06 00:40:05 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Clemens Neudecker 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								e696a068cb 
								
							 
						 
						
							
							
								
								Fix typos  
							
							
							
						 
						
							2019-12-06 00:20:34 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Clemens Neudecker 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								d90dad48fd 
								
							 
						 
						
							
							
								
								PAGE2019  
							
							
							
						 
						
							2019-12-05 22:24:28 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Rezanezhad, Vahid 
								
							 
						 
						
							
							
							
							
								
							
							
								19116091f9 
								
							 
						 
						
							
							
								
								Update config_params.json  
							
							
							
						 
						
							2019-12-05 14:05:55 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								af5cbe9052 
								
							 
						 
						
							
							
								
								🐛  sbb_textline_detector: Fix making the output file id  
							
							
							
						 
						
							2019-12-04 11:42:45 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Rezanezhad, Vahid 
								
							 
						 
						
							
							
							
							
								
							
							
								2112bb18c6 
								
							 
						 
						
							
							
								
								fixed the bug: local variable 't4' referenced before assignment  
							
							
							
						 
						
							2019-11-29 11:29:12 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Rezanezhad, Vahid 
								
							 
						 
						
							
							
							
							
								
							
							
								a11f6740cb 
								
							 
						 
						
							
							
								
								Update main.py - robust deskewing and better page extraction  
							
							
							
						 
						
							2019-11-28 16:19:44 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Rezanezhad, Vahid 
								
							 
						 
						
							
							
							
							
								
							
							
								0182b7087f 
								
							 
						 
						
							
							
								
								remove multiprocessing bug  
							
							
							
						 
						
							2019-11-20 14:05:15 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								8fa7179560 
								
							 
						 
						
							
							
								
								🐛  sbb_textline_detector: Disable multiprocessing to fix race condition  
							
							... 
							
							
							
							Lines were sorted in the wrong regions. Work around this by disabling
multiprocessing until a proper fix is done. 
							
						 
						
							2019-11-20 09:50:29 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								4aed06a325 
								
							 
						 
						
							
							
								
								✨  sbb_textline_detection: Preserve input PAGE info by merging segmentation results  
							
							... 
							
							
							
							ocrd_sbb_textline_detection used the output XML by main.py as is, and
– by doing this – threw away any input data from the input PAGE,
including the critical pc:AlternativeImage and the less important
pc:MetadataItem.
Fix this by merging the segmentation results into a file created from
the input file.
Also add a pc:MetadataItem processingStep about the segmentation
operation. 
							
						 
						
							2019-11-19 15:08:53 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								4fb3e70ef6 
								
							 
						 
						
							
							
								
								🧹  sbb_textline_detector: Do not create empty/space-only TextEquivs (again)  
							
							
							
						 
						
							2019-11-19 11:08:41 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								bf41a29e7b 
								
							 
						 
						
							
							
								
								🐛  sbb_textline_detector: Do not hardcode Created/LastChange elements  
							
							
							
						 
						
							2019-11-19 11:05:18 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								fbd21cdb81 
								
							 
						 
						
							
							
								
								🧹  sbb_textline_detector: Do not create empty/space-only TextEquivs (again)  
							
							
							
						 
						
							2019-11-19 10:59:41 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Rezanezhad, Vahid 
								
							 
						 
						
							
							
							
							
								
							
							
								2d6dd92b31 
								
							 
						 
						
							
							
								
								Update main.py  
							
							
							
						 
						
							2019-11-04 11:10:17 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Rezanezhad, Vahid 
								
							 
						 
						
							
							
							
							
								
							
							
								9f97f34255 
								
							 
						 
						
							
							
								
								Update main.py  
							
							
							
						 
						
							2019-10-31 17:36:21 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Rezanezhad, Vahid 
								
							 
						 
						
							
							
							
							
								
							
							
								8c954a6c7a 
								
							 
						 
						
							
							
								
								Update main.py  
							
							
							
						 
						
							2019-10-31 17:08:35 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Rezanezhad, Vahid 
								
							 
						 
						
							
							
							
							
								
							
							
								6714481556 
								
							 
						 
						
							
							
								
								Update main.py  
							
							
							
						 
						
							2019-10-31 10:54:57 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Rezanezhad, Vahid 
								
							 
						 
						
							
							
							
							
								
							
							
								719824f19d 
								
							 
						 
						
							
							
								
								Update main.py  
							
							
							
						 
						
							2019-10-30 13:37:54 +01:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								f94511a1d8 
								
							 
						 
						
							
							
								
								Merge branch 'master' of code.dev.sbb.berlin:qurator/mono-repo  
							
							
							
						 
						
							2019-10-25 18:11:17 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								4f28cd905a 
								
							 
						 
						
							
							
								
								🧹  sbb_textline_detector: Do not create empty/space-only TextEquivs  
							
							... 
							
							
							
							ocrd_tesserocr or ocrd_cis complain about already existing text if
empty/space-only TextEquivs elements exist after segmentation. Also, it
does not make sense to create them in a segmentation step.
Fix by removing the code generating the elements. 
							
						 
						
							2019-10-25 18:08:31 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Rezanezhad, Vahid 
								
							 
						 
						
							
							
							
							
								
							
							
								00929ab391 
								
							 
						 
						
							
							
								
								Update main.py  
							
							
							
						 
						
							2019-10-25 14:39:37 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								f0dd955606 
								
							 
						 
						
							
							
								
								Merge branch 'master' of code.dev.sbb.berlin:qurator/mono-repo  
							
							
							
						 
						
							2019-10-25 14:20:44 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								2528573b4f 
								
							 
						 
						
							
							
								
								✨  sbb_textline_detector: Allow PAGE input in OCR-D interface  
							
							... 
							
							
							
							Previous OCR-D processors may output PAGE files instead of image files.
Resolve images file from PAGE files if necessary. 
							
						 
						
							2019-10-25 14:16:09 +02:00 
							
								 
							
							
								 
							
						 
					 
				
					
						
							
								
								
									Rezanezhad, Vahid 
								
							 
						 
						
							
							
							
							
								
							
							
								d8e04e3de4 
								
							 
						 
						
							
							
								
								memory leakage is removed. New deskewing methid is integrated.  
							
							
							
						 
						
							2019-10-25 14:07:36 +02:00