11a04916f3 
								
							 
						 
						
							
							
								
								🐛  Write mods_info Parquet file again  
							
							 
							
							
							
						 
						
							2024-11-28 18:27:39 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								abb20b8ba9 
								
							 
						 
						
							
							
								
								🐛  Add multivolume type 'multivolume_manuscript'  
							
							 
							
							
							
						 
						
							2024-11-28 14:25:27 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								8ee4c3d0bc 
								
							 
						 
						
							
							
								
								🐛  Normalize structure type names to lower case  
							
							 
							
							
							
						 
						
							2024-11-27 19:56:36 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								939967edc8 
								
							 
						 
						
							
							
								
								🐛  De-couple mods_info from page_info  
							
							 
							
							
							
						 
						
							2024-11-27 19:05:05 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								11d7b012ec 
								
							 
						 
						
							
							
								
								🐛  Leave tqdm progress bar to avoid confusion through other left-over progress bars  
							
							 
							
							
							
						 
						
							2024-11-27 19:03:35 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								22b62d7a2f 
								
							 
						 
						
							
							
								
								🐛  Remove output files before writing them again  
							
							 
							
							
							
						 
						
							2024-11-27 18:48:56 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								eeaad03686 
								
							 
						 
						
							
							
								
								🚧  Avoid nested quotes for Python < 3.12  
							
							 
							
							
							
						 
						
							2024-11-27 16:38:18 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								b385f27391 
								
							 
						 
						
							
							
								
								🚧  Write out page_info  
							
							 
							
							
							
						 
						
							2024-11-27 14:43:42 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								a1390699d4 
								
							 
						 
						
							
							
								
								🚧  Use a temporary sqlite db  
							
							 
							
							
							
						 
						
							2024-11-26 16:27:43 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								8d6b97f6b3 
								
							 
						 
						
							
							
								
								🐛  Fix typo in XlsxWriter dependency  
							
							 
							
							
							
						 
						
							2024-08-02 05:55:47 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								7122f0265f 
								
							 
						 
						
							
							
								
								Remove direct CSV/Excel support  
							
							 
							
							... 
							
							
							
							Remove direct CSV/Excel support from the CLI; README now has instructions to convert.
Closes gh-40. 
							
						 
						
							2024-07-31 11:09:34 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								a1f333f4a4 
								
							 
						 
						
							
							
								
								🐛  Fix converting/writing out per-page information (e.g. structure information)  
							
							 
							
							
							
						 
						
							2024-07-31 10:27:46 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								1bf86bfb4c 
								
							 
						 
						
							
							
								
								✔ Test on Python 3.12  
							
							 
							
							
							
						 
						
							2024-07-29 07:02:59 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								191867cdef 
								
							 
						 
						
							
							
								
								⚙ Make saving per-page information optional  
							
							 
							
							
							
						 
						
							2024-07-29 06:08:01 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								dd4febf24d 
								
							 
						 
						
							
							
								
								🚧  Write a Parquet file  
							
							 
							
							
							
						 
						
							2024-07-27 12:57:33 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								03d86ce68a 
								
							 
						 
						
							
							
								
								🐛  Fix tests  
							
							 
							
							
							
						 
						
							2024-07-25 13:26:12 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								ae650f70a2 
								
							 
						 
						
							
							
								
								⚙ Migrate to pyproject.toml  
							
							 
							
							
							
						 
						
							2024-07-25 13:20:18 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								187da054b0 
								
							 
						 
						
							
							
								
								⚙ Migrate to pyproject.toml  
							
							 
							
							
							
						 
						
							2024-07-25 12:45:22 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								acd9c5cd4b 
								
							 
						 
						
							
							
								
								Merge branch 'feat/page_info' of  https://github.com/qurator-spk/mods4pandas  into feat/page_info  
							
							 
							
							
							
						 
						
							2024-07-25 12:01:49 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								515d39bb1d 
								
							 
						 
						
							
							
								
								🚧  Workaround NumPy incompatibility by requiring < 2  
							
							 
							
							
							
						 
						
							2024-07-25 12:01:35 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								e9fca0f563 
								
							 
						 
						
							
							
								
								🐛  mods4pandas: Handle MultiVolumeWork (differently spelled type cp. to before) without structMap TYPE='PHYSICAL'  
							
							 
							
							
							
						 
						
							2023-12-12 13:33:05 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								b8a2872582 
								
							 
						 
						
							
							
								
								🐛  mods4pandas: Handle periodical without structMap TYPE='PHYSICAL'  
							
							 
							
							
							
						 
						
							2023-12-12 13:13:23 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								6226618f40 
								
							 
						 
						
							
							
								
								🐛  mods4pandas: Handle multivolume_work without structMap TYPE='PHYSICAL'  
							
							 
							
							
							
						 
						
							2023-12-12 12:34:24 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								0acaa83163 
								
							 
						 
						
							
							
								
								⚡  Use relative predicate  
							
							 
							
							
							
						 
						
							2023-12-09 12:48:07 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								8fc4eeeb3b 
								
							 
						 
						
							
							
								
								⚡  Make get_sets_file faster by using a lookup table  
							
							 
							
							
							
						 
						
							2023-12-09 12:05:29 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								912e5d2b4a 
								
							 
						 
						
							
							
								
								⚡  Make get_struct_log faster by using precise predicates  
							
							 
							
							
							
						 
						
							2023-12-09 11:40:45 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								448639b05b 
								
							 
						 
						
							
							
								
								⚡  Make get_struct_log faster by using precise predicates  
							
							 
							
							
							
						 
						
							2023-12-09 11:35:24 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								1dac77a2f5 
								
							 
						 
						
							
							
								
								⚡  Make get_struct_log faster by using find(all) instead of xpath()  
							
							 
							
							
							
						 
						
							2023-12-09 10:36:55 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								90c60ebb80 
								
							 
						 
						
							
							
								
								⚡  Make get_mets_file a lot faster by using find() instead of xpath()  
							
							 
							
							
							
						 
						
							2023-12-09 10:24:38 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								16a3a3bcc8 
								
							 
						 
						
							
							
								
								✔ Fix tests on Python 3.8 by backporting removeprefix  
							
							 
							
							
							
						 
						
							2023-12-09 09:21:10 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								8d0dc72ca2 
								
							 
						 
						
							
							
								
								✔ Enable/document profiling  
							
							 
							
							
							
						 
						
							2023-12-08 16:28:45 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								8c269b35a4 
								
							 
						 
						
							
							
								
								✔ Test creation of page_info  
							
							 
							
							
							
						 
						
							2023-12-08 15:58:59 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								f243dd204a 
								
							 
						 
						
							
							
								
								✒ Add comments for populating type indicator variables  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:15 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								ddffb76fb6 
								
							 
						 
						
							
							
								
								🐛  Fix getting parent elements if necessary  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:15 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								c5332ae80d 
								
							 
						 
						
							
							
								
								🚧  Write out page_info  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:15 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								e51fa5750f 
								
							 
						 
						
							
							
								
								🧹  Remove debug noise  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:15 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								b8980bbf25 
								
							 
						 
						
							
							
								
								🧹  page_info: Name structMap type columns a bit more consistently  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								3ec0f8c62a 
								
							 
						 
						
							
							
								
								✔ CircleCI: Don't test on Python 3.12 yet  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								e1238259b7 
								
							 
						 
						
							
							
								
								✔ CircleCI: Don't test on EOL Python 3.6/3.7, but test on 3.11/3.12  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								3d920f2b50 
								
							 
						 
						
							
							
								
								🐛  Use List/Dict for type annotations to support ye olde Python  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								968572168e 
								
							 
						 
						
							
							
								
								🧹  Extract a function to convert list[dict] to a DataFrame  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								5c2dfa8505 
								
							 
						 
						
							
							
								
								✔ Add another (large) METS example  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:14 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								889d36f0d4 
								
							 
						 
						
							
							
								
								✨  page_info: Retrieve filenames + structMap types  
							
							 
							
							
							
						 
						
							2023-11-28 15:47:13 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								dd3943eaf6 
								
							 
						 
						
							
							
								
								🧹  .gitignore pyenv's .python-version  
							
							 
							
							
							
						 
						
							2023-11-28 15:45:48 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								a769d89d0a 
								
							 
						 
						
							
							
								
								🎨  Rename test_modstool → test_mod4pandas  
							
							 
							
							
							
						 
						
							2023-11-10 17:58:53 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								5238c0600b 
								
							 
						 
						
							
							
								
								Merge branch 'master' of  https://github.com/qurator-spk/mods4pandas  
							
							 
							
							
							
						 
						
							2023-11-10 17:57:46 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								7def0bccaf 
								
							 
						 
						
							
							
								
								🎨  Reformat test METS/MODS files (to make them easier to read)  
							
							 
							
							
							
						 
						
							2023-11-10 17:57:37 +01:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								100b2a5e6c 
								
							 
						 
						
							
							
								
								🐛   Fix mods:relatedItem with mods:recordIdentifier source=dnb-ppn  
							
							 
							
							... 
							
							
							
							mods:relatedItem may have a mods:recordIdentifier with source="dnb-ppn".
This may happen for digitized works that have their original work in
another library and use a DNB PPN there.
Fixes gh-22. 
							
						 
						
							2023-04-17 19:21:43 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								4e7b8ed642 
								
							 
						 
						
							
							
								
								✨  Convert mods:relatedItem for types original and host  
							
							 
							
							... 
							
							
							
							Fixes gh-21. 
							
						 
						
							2023-04-14 12:53:31 +02:00  
						
						
							 
							
							
							
								 
							 
							
						 
					 
				
					
						
							
						 
						
							
							
							
							
								
							
							
								6d8ba871eb 
								
							 
						 
						
							
							
								
								🎨  Fix link to CircleCI project  
							
							 
							
							
							
						 
						
							2022-07-04 19:34:13 +02:00