5c2dfa8505 
								
							 
						 
						
							
							
								
								✔ Add another (large) METS example  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								889d36f0d4 
								
							 
						 
						
							
							
								
								✨  page_info: Retrieve filenames + structMap types  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:13 +01:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								a769d89d0a 
								
							 
						 
						
							
							
								
								🎨  Rename test_modstool → test_mod4pandas  
							
							 
							
							
							
						 
						
							2023-11-10 17:58:53 +01:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								5238c0600b 
								
							 
						 
						
							
							
								
								Merge branch 'master' of  https://github.com/qurator-spk/mods4pandas  
							
							 
							
							
							
						 
						
							2023-11-10 17:57:46 +01:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								7def0bccaf 
								
							 
						 
						
							
							
								
								🎨  Reformat test METS/MODS files (to make them easier to read)  
							
							 
							
							
							
						 
						
							2023-11-10 17:57:37 +01:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								100b2a5e6c 
								
							 
						 
						
							
							
								
								🐛   Fix mods:relatedItem with mods:recordIdentifier source=dnb-ppn  
							
							 
							
							... 
							
							
							
							mods:relatedItem may have a mods:recordIdentifier with source="dnb-ppn".
This may happen for digitized works that have their original work in
another library and use a DNB PPN there.
Fixes gh-22. 
							
						 
						
							2023-04-17 19:21:43 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								4e7b8ed642 
								
							 
						 
						
							
							
								
								✨  Convert mods:relatedItem for types original and host  
							
							 
							
							... 
							
							
							
							Fixes gh-21. 
							
						 
						
							2023-04-14 12:53:31 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								9c0dce7a04 
								
							 
						 
						
							
							
								
								🎨  Rename modstool to mods4pandas in the last code parts  
							
							 
							
							
							
						 
						
							2022-07-04 19:26:41 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								3c2e59f0ed 
								
							 
						 
						
							
							
								
								🎨  Rename qurator.modstool to qurator.mods4pandas  
							
							 
							
							
							
						 
						
							2022-07-04 19:11:10 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								1d2c5e2d10 
								
							 
						 
						
							
							
								
								🎨  Rename modstool.py to mods4pandas.py  
							
							 
							
							
							
						 
						
							2022-07-04 18:58:39 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								6f2265a619 
								
							 
						 
						
							
							
								
								✔️  Add test data  
							
							 
							
							
							
						 
						
							2022-06-21 12:54:26 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								c803ce0907 
								
							 
						 
						
							
							
								
								✨  Count all alto:String elements with TAGREFS attribute  
							
							 
							
							
							
						 
						
							2022-06-17 17:59:34 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								a40716a320 
								
							 
						 
						
							
							
								
								✨  ALTO: Count alto:Tags  
							
							 
							
							
							
						 
						
							2022-06-17 17:32:17 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								de50f13043 
								
							 
						 
						
							
							
								
								🚧  alto4pandas: Determine ALTO namespace for group  
							
							 
							
							
							
						 
						
							2022-06-17 17:01:07 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								53a8db955c 
								
							 
						 
						
							
							
								
								🐛  Consistently use lxml for etree  
							
							 
							
							
							
						 
						
							2022-06-16 19:42:44 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								21f906ec7d 
								
							 
						 
						
							
							
								
								✨  Rename altotool to alto4pandas  
							
							 
							
							... 
							
							
							
							See gh-15. 
							
						 
						
							2022-06-16 19:27:59 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								3d2e53f739 
								
							 
						 
						
							
							
								
								✨  ALTO: Extract namespace == ALTO version  
							
							 
							
							
							
						 
						
							2022-06-08 18:25:33 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								8285bdb423 
								
							 
						 
						
							
							
								
								🚧  ALTO: Calculate more descriptive statistics for String@WC  
							
							 
							
							
							
						 
						
							2022-05-23 19:45:44 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								aa4e8e290d 
								
							 
						 
						
							
							
								
								🚧  ALTO: Move xpath_statistics to TagGroup class  
							
							 
							
							
							
						 
						
							2022-05-23 19:39:21 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								9246519162 
								
							 
						 
						
							
							
								
								🚧  ALTO: Extract a function to calculate statistics on xpath expressions  
							
							 
							
							
							
						 
						
							2022-05-23 19:33:54 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								e24a846ea2 
								
							 
						 
						
							
							
								
								🚧  ALTO: Calculate mean of String@WC  
							
							 
							
							
							
						 
						
							2022-05-23 19:12:39 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								9b3db1cd1d 
								
							 
						 
						
							
							
								
								✨  ALTO: Support more ALTO versions  
							
							 
							
							
							
						 
						
							2022-05-10 19:32:26 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								937e7d74eb 
								
							 
						 
						
							
							
								
								✨  ALTO: Support more ALTO versions  
							
							 
							
							
							
						 
						
							2022-05-10 18:15:35 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								4bb3379ab1 
								
							 
						 
						
							
							
								
								🐛  Use tqdm's write() instead of logging during scanning  
							
							 
							
							
							
						 
						
							2022-05-10 17:57:36 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								6a549968b5 
								
							 
						 
						
							
							
								
								🐛  Produce a text attribute even if the attribute has no value  
							
							 
							
							
							
						 
						
							2022-05-10 17:47:38 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								c85356bd23 
								
							 
						 
						
							
							
								
								✨  ALTO: Support more ALTO versions  
							
							 
							
							
							
						 
						
							2022-05-10 17:46:50 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								c91c9b1714 
								
							 
						 
						
							
							
								
								✨  ALTO: preProcessingStep/processingAgency/sourceImageInformation etc.  
							
							 
							
							
							
						 
						
							2022-05-10 14:27:39 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								01326050d3 
								
							 
						 
						
							
							
								
								✨  ALTO: Handle PermissionErrors  
							
							 
							
							
							
						 
						
							2022-05-09 18:28:31 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								10b8023dd6 
								
							 
						 
						
							
							
								
								✨  ALTO: Count Layout/Page/* elements  
							
							 
							
							
							
						 
						
							2022-05-06 20:59:51 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								1c62085612 
								
							 
						 
						
							
							
								
								✨  ALTO: Count Layout/Page/* elements  
							
							 
							
							
							
						 
						
							2022-05-06 20:28:55 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								c9737683b1 
								
							 
						 
						
							
							
								
								✨  ALTO: Add Layout/Page's attribute values  
							
							 
							
							
							
						 
						
							2022-05-06 19:59:19 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								102b15ffa9 
								
							 
						 
						
							
							
								
								🧹  Do not duplicate ALTO metadata  
							
							 
							
							
							
						 
						
							2022-05-06 19:36:50 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								6e2e0bd67a 
								
							 
						 
						
							
							
								
								🐛  Fix imports  
							
							 
							
							
							
						 
						
							2022-05-05 11:10:59 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								e86369e76d 
								
							 
						 
						
							
							
								
								🚧  Add support for ALTO Description  
							
							 
							
							
							
						 
						
							2022-05-04 20:02:27 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								08082d5fe8 
								
							 
						 
						
							
							
								
								✨  Support mods:partName  
							
							 
							
							... 
							
							
							
							Fixes gh-6. 
							
						 
						
							2022-04-07 17:37:08 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								9227575555 
								
							 
						 
						
							
							
								
								🎨  Improve log/output a bit  
							
							 
							
							
							
						 
						
							2022-04-07 16:35:18 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								db79960ba1 
								
							 
						 
						
							
							
								
								✨  Force singleton for shelfLocator  
							
							 
							
							... 
							
							
							
							Very few input sources contain multiple mods:shelfLocator elements
for a mods:location (illegal according to the DFG MODS Anwendungsprofil).
Force a singleton in this case.
Fixes gh-7. 
							
						 
						
							2022-04-07 16:22:41 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								f9e418c460 
								
							 
						 
						
							
							
								
								✨  Optionally output to an Excel .xlsx file  
							
							 
							
							
							
						 
						
							2022-04-06 19:08:38 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								0a9a66c2cc 
								
							 
						 
						
							
							
								
								✨  Optionally output to a CSV file  
							
							 
							
							... 
							
							
							
							Resolves gh-9. 
							
						 
						
							2022-04-06 16:46:48 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								86d1154638 
								
							 
						 
						
							
							
								
								✔️  Add METS tests  
							
							 
							
							
							
						 
						
							2022-04-01 16:05:07 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								9a8f7f69bd 
								
							 
						 
						
							
							
								
								🐛  Handle multiple mods:role  
							
							 
							
							
							
						 
						
							2022-04-01 14:52:54 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								75ff143a25 
								
							 
						 
						
							
							
								
								🐛  modstool: Fix handling multiple <mods:language>  
							
							 
							
							... 
							
							
							
							There may be multiple <mods:language> tags with mods:languageTerm children,
that should be merged into one language_languageTerm column 
							
						 
						
							2022-04-01 14:02:19 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								73333ea2e2 
								
							 
						 
						
							
							
								
								⚡  Include METS fileGrp counts  
							
							 
							
							
							
						 
						
							2022-03-31 21:03:58 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								93ce1505c4 
								
							 
						 
						
							
							
								
								✨  Handle namePart + nameIdentifier  
							
							 
							
							
							
						 
						
							2022-03-31 18:57:35 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								d885d6bfa2 
								
							 
						 
						
							
							
								
								🤪  modstool: Fiddle with the damn packaging/namespace so that stuff works  
							
							 
							
							
							
						 
						
							2019-08-29 16:15:48 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								5773b9c9b1 
								
							 
						 
						
							
							
								
								🐛  modstool: Handle multiple scriptTerms per language correctly  
							
							 
							
							
							
						 
						
							2019-08-29 15:42:13 +02:00  
						
						
							 
							
							
							
								 
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								9b8aef12e1 
								
							 
						 
						
							
							
								
								🠒 Move modstool into its own subdirectory  
							
							 
							
							
							
						 
						
							2019-08-28 16:18:39 +02:00