diff --git a/.gitignore b/.gitignore index f785ff4..79203a2 100644 --- a/.gitignore +++ b/.gitignore @@ -1,3 +1,7 @@ +# Output files +aardvark/* +!aardvark/.gitkeep + # Byte-compiled / optimized / DLL files __pycache__/ *.py[cod] diff --git a/1.0-to-aardvark.py b/1.0-to-aardvark.py index 4603935..f658e58 100644 --- a/1.0-to-aardvark.py +++ b/1.0-to-aardvark.py @@ -32,6 +32,13 @@ def schema_update(filepath): for old_schema, new_schema in crosswalk.items(): if old_schema in data: data[new_schema] = data.pop(old_schema) + + # Change the metadata type: + data["gbl_mdVersion_s"] = "Aardvark" + + # Remove geoblacklight_version + if "geoblacklight_version" in data: + data.pop("geoblacklight_version") # check for multi-valued fields - if so, convert its value to an array data = string2array(data) diff --git a/aardvark/.gitkeep b/aardvark/.gitkeep new file mode 100644 index 0000000..e69de29 diff --git a/crosswalk.csv b/crosswalk.csv index eb93a72..393e62b 100644 --- a/crosswalk.csv +++ b/crosswalk.csv @@ -20,5 +20,4 @@ dct_references_s,dct_references_s layer_slug_s,id dc_identifier_s,dct_identifier_sm layer_modified_dt,gbl_mdModified_dt -geoblacklight_version,gbl_mdVersion_s -suppressed_b,gbl_suppressed_b \ No newline at end of file +suppressed_b,gbl_suppressed_b