mirror of
				https://github.com/qurator-spk/ocrd-galley.git
				synced 2025-10-31 11:14:12 +01:00 
			
		
		
		
	Refactor: Extract functions for the steps
This commit is contained in:
		
							parent
							
								
									a2d547b857
								
							
						
					
					
						commit
						c207859bcd
					
				
					 1 changed files with 27 additions and 19 deletions
				
			
		|  | @ -13,27 +13,35 @@ remove_filegrp() { | |||
|     -d "//mets:fileGrp[@USE='$filegrp_use']" $mets | ||||
| } | ||||
| 
 | ||||
| 
 | ||||
| ocrd_typegroups_classifier_parameters=' | ||||
| { | ||||
| do_fontident() { | ||||
|   ocrd_typegroups_classifier_parameters=' | ||||
|   { | ||||
|     "network": "/home/mike/devel/OCR-D/monorepo/ocrd_typegroups_classifier/ocrd_typegroups_classifier/models/classifier.tgc", | ||||
|     "stride":143 | ||||
| }' | ||||
| remove_filegrp OCR-D-FONTIDENT mets.xml | ||||
| ocrd-typegroups-classifier -l DEBUG \ | ||||
|   }' | ||||
|   remove_filegrp OCR-D-FONTIDENT mets.xml | ||||
|   ocrd-typegroups-classifier -l DEBUG \ | ||||
|     -m mets.xml -I OCR-D-IMG -O OCR-D-FONTIDENT \ | ||||
|     -p <(echo $ocrd_typegroups_classifier_parameters) | ||||
| # XXX does DEFAULT have any meaning? /buerger_gedichte_1778.ocrd does not have | ||||
| #     any DEFAULT, yet -I DEFAULT seems to work for ocrd-typegroups-classifier | ||||
| #ocrd workspace validate mets.xml | ||||
| # XXX <error>Unspecified USE category 'FONTIDENT' in fileGrp 'OCR-D-FONTIDENT'</error> | ||||
| # XXX <error>File 'OCR-D-FONTIDENT_OCR-D-IMG_0002' does not manifest any physical page.</error> | ||||
| # XXX <notice>Won't download remote image <OCR-D-IMG/OCR-D-IMG_0002></notice> | ||||
|   # XXX does DEFAULT have any meaning? /buerger_gedichte_1778.ocrd does not have | ||||
|   #     any DEFAULT, yet -I DEFAULT seems to work for ocrd-typegroups-classifier | ||||
|   #ocrd workspace validate mets.xml | ||||
|   # XXX <error>Unspecified USE category 'FONTIDENT' in fileGrp 'OCR-D-FONTIDENT'</error> | ||||
|   # XXX <error>File 'OCR-D-FONTIDENT_OCR-D-IMG_0002' does not manifest any physical page.</error> | ||||
|   # XXX <notice>Won't download remote image <OCR-D-IMG/OCR-D-IMG_0002></notice> | ||||
| } | ||||
| 
 | ||||
| remove_filegrp OCR-D-SEG-LINE mets.xml | ||||
| ocrd-tesserocr-segment-line -l DEBUG \ | ||||
| do_linesegmentation() { | ||||
|   remove_filegrp OCR-D-SEG-LINE mets.xml | ||||
|   ocrd-tesserocr-segment-line -l DEBUG \ | ||||
|     -m mets.xml -I OCR-D-IMG -O OCR-D-SEG-LINE | ||||
| #ocrd workspace validate mets.xml | ||||
|   #ocrd workspace validate mets.xml | ||||
| } | ||||
| 
 | ||||
| 
 | ||||
| do_fontident | ||||
| do_linesegmentation | ||||
| 
 | ||||
| 
 | ||||
| 
 | ||||
| # vim:tw=120: | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue