c5332ae80d 
								
							 
						 
						
							
							
								
								🚧  Write out page_info  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:15 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								e51fa5750f 
								
							 
						 
						
							
							
								
								🧹  Remove debug noise  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:15 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								b8980bbf25 
								
							 
						 
						
							
							
								
								🧹  page_info: Name structMap type columns a bit more consistently  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								3ec0f8c62a 
								
							 
						 
						
							
							
								
								✔ CircleCI: Don't test on Python 3.12 yet  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								e1238259b7 
								
							 
						 
						
							
							
								
								✔ CircleCI: Don't test on EOL Python 3.6/3.7, but test on 3.11/3.12  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								3d920f2b50 
								
							 
						 
						
							
							
								
								🐛  Use List/Dict for type annotations to support ye olde Python  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								968572168e 
								
							 
						 
						
							
							
								
								🧹  Extract a function to convert list[dict] to a DataFrame  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								5c2dfa8505 
								
							 
						 
						
							
							
								
								✔ Add another (large) METS example  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								889d36f0d4 
								
							 
						 
						
							
							
								
								✨  page_info: Retrieve filenames + structMap types  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:13 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								dd3943eaf6 
								
							 
						 
						
							
							
								
								🧹  .gitignore pyenv's .python-version  
							
							 
							
							
							
						 
						
							2023-11-28 15:45:48 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								a769d89d0a 
								
							 
						 
						
							
							
								
								🎨  Rename test_modstool → test_mod4pandas  
							
							 
							
							
							
						 
						
							2023-11-10 17:58:53 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								5238c0600b 
								
							 
						 
						
							
							
								
								Merge branch 'master' of  https://github.com/qurator-spk/mods4pandas  
							
							 
							
							
							
						 
						
							2023-11-10 17:57:46 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								7def0bccaf 
								
							 
						 
						
							
							
								
								🎨  Reformat test METS/MOTS files (to make them easier to read)  
							
							 
							
							
							
						 
						
							2023-11-10 17:57:37 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								100b2a5e6c 
								
							 
						 
						
							
							
								
								🐛   Fix mods:relatedItem with mods:recordIdentifier source=dnb-ppn  
							
							 
							
							... 
							
							
							
							mods:relatedItem may have a mods:recordIdentifier with source="dnb-ppn".
This may happen for digitized works that have their original work in
another library and use a DNB PPN there.
Fixes gh-22. 
							
						 
						
							2023-04-17 19:21:43 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								4e7b8ed642 
								
							 
						 
						
							
							
								
								✨  Convert mods:relatedItem for types original and host  
							
							 
							
							... 
							
							
							
							Fixes gh-21. 
							
						 
						
							2023-04-14 12:53:31 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								6d8ba871eb 
								
							 
						 
						
							
							
								
								🎨  Fix link to CircleCI project  
							
							 
							
							
							
						 
						
							2022-07-04 19:34:13 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								1dfdacc5a5 
								
							 
						 
						
							
							
								
								🎨  Rename the Python package to mods4pandas  
							
							 
							
							
							
						 
						
							2022-07-04 19:28:34 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								9c0dce7a04 
								
							 
						 
						
							
							
								
								🎨  Rename modstool to mods4pandas in the last code parts  
							
							 
							
							
							
						 
						
							2022-07-04 19:26:41 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								03d2fc9670 
								
							 
						 
						
							
							
								
								🎨  Rename qurator.modstool to qurator.mods4pandas  
							
							 
							
							
							
						 
						
							2022-07-04 19:24:33 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								3c2e59f0ed 
								
							 
						 
						
							
							
								
								🎨  Rename qurator.modstool to qurator.mods4pandas  
							
							 
							
							
							
						 
						
							2022-07-04 19:11:10 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								1d2c5e2d10 
								
							 
						 
						
							
							
								
								🎨  Rename modstool.py to mods4pandas.py  
							
							 
							
							
							
						 
						
							2022-07-04 18:58:39 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								c48084de93 
								
							 
						 
						
							
							
								
								➡️  Rename modstool script to mods4pandas  
							
							 
							
							
							
						 
						
							2022-06-29 17:25:39 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								3121621e14 
								
							 
						 
						
							
							
								
								📝  README: Fix typo  
							
							 
							
							
							
						 
						
							2022-06-21 13:16:10 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								83befba3ab 
								
							 
						 
						
							
							
								
								📝  README: Fix markdown  
							
							 
							
							
							
						 
						
							2022-06-21 13:15:14 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								f507370729 
								
							 
						 
						
							
							
								
								📝  README: Add some documentation for alto4pandas  
							
							 
							
							
							
						 
						
							2022-06-21 13:12:44 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								6f2265a619 
								
							 
						 
						
							
							
								
								✔️  Add test data  
							
							 
							
							
							
						 
						
							2022-06-21 12:54:26 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								c803ce0907 
								
							 
						 
						
							
							
								
								✨  Count all alto:String elements with TAGREFS attribute  
							
							 
							
							
							
						 
						
							2022-06-17 17:59:34 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								a40716a320 
								
							 
						 
						
							
							
								
								✨  ALTO: Count alto:Tags  
							
							 
							
							
							
						 
						
							2022-06-17 17:32:17 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								de50f13043 
								
							 
						 
						
							
							
								
								🚧  alto4pandas: Determine ALTO namespace for group  
							
							 
							
							
							
						 
						
							2022-06-17 17:01:07 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								53a8db955c 
								
							 
						 
						
							
							
								
								🐛  Consistently use lxml for etree  
							
							 
							
							
							
						 
						
							2022-06-16 19:42:44 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								a2fb3ee387 
								
							 
						 
						
							
							
								
								Merge branch 'feat/alto'  
							
							 
							
							
							
						 
						
							2022-06-16 19:29:44 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								21f906ec7d 
								
							 
						 
						
							
							
								
								✨  Rename altotool to alto4pandas  
							
							 
							
							... 
							
							
							
							See gh-15. 
							
						 
						
							2022-06-16 19:27:59 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								3d2e53f739 
								
							 
						 
						
							
							
								
								✨  ALTO: Extract namespace == ALTO version  
							
							 
							
							
							
						 
						
							2022-06-08 18:25:33 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								8285bdb423 
								
							 
						 
						
							
							
								
								🚧  ALTO: Calculate more descriptive statistics for String@WC  
							
							 
							
							
							
						 
						
							2022-05-23 19:45:44 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								aa4e8e290d 
								
							 
						 
						
							
							
								
								🚧  ALTO: Move xpath_statistics to TagGroup class  
							
							 
							
							
							
						 
						
							2022-05-23 19:39:21 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								9246519162 
								
							 
						 
						
							
							
								
								🚧  ALTO: Extract a function to calculate statistics on xpath expressions  
							
							 
							
							
							
						 
						
							2022-05-23 19:33:54 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								e24a846ea2 
								
							 
						 
						
							
							
								
								🚧  ALTO: Calculate mean of String@WC  
							
							 
							
							
							
						 
						
							2022-05-23 19:12:39 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								9b3db1cd1d 
								
							 
						 
						
							
							
								
								✨  ALTO: Support more ALTO versions  
							
							 
							
							
							
						 
						
							2022-05-10 19:32:26 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								937e7d74eb 
								
							 
						 
						
							
							
								
								✨  ALTO: Support more ALTO versions  
							
							 
							
							
							
						 
						
							2022-05-10 18:15:35 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								4bb3379ab1 
								
							 
						 
						
							
							
								
								🐛  Use tqdm's write() instead of logging during scanning  
							
							 
							
							
							
						 
						
							2022-05-10 17:57:36 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								6a549968b5 
								
							 
						 
						
							
							
								
								🐛  Produce a text attribute even if the attribute has no value  
							
							 
							
							
							
						 
						
							2022-05-10 17:47:38 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								c85356bd23 
								
							 
						 
						
							
							
								
								✨  ALTO: Support more ALTO versions  
							
							 
							
							
							
						 
						
							2022-05-10 17:46:50 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								c91c9b1714 
								
							 
						 
						
							
							
								
								✨  ALTO: preProcessingStep/processingAgency/sourceImageInformation etc.  
							
							 
							
							
							
						 
						
							2022-05-10 14:27:39 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								01326050d3 
								
							 
						 
						
							
							
								
								✨  ALTO: Handle PermissionErrors  
							
							 
							
							
							
						 
						
							2022-05-09 18:28:31 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								10b8023dd6 
								
							 
						 
						
							
							
								
								✨  ALTO: Count Layout/Page/* elements  
							
							 
							
							
							
						 
						
							2022-05-06 20:59:51 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								1c62085612 
								
							 
						 
						
							
							
								
								✨  ALTO: Count Layout/Page/* elements  
							
							 
							
							
							
						 
						
							2022-05-06 20:28:55 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								c9737683b1 
								
							 
						 
						
							
							
								
								✨  ALTO: Add Layout/Page's attribute values  
							
							 
							
							
							
						 
						
							2022-05-06 19:59:19 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								102b15ffa9 
								
							 
						 
						
							
							
								
								🧹  Do not duplicate ALTO metadata  
							
							 
							
							
							
						 
						
							2022-05-06 19:36:50 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								6e2e0bd67a 
								
							 
						 
						
							
							
								
								🐛  Fix imports  
							
							 
							
							
							
						 
						
							2022-05-05 11:10:59 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								e86369e76d 
								
							 
						 
						
							
							
								
								🚧  Add support for ALTO Description  
							
							 
							
							
							
						 
						
							2022-05-04 20:02:27 +02:00