caltechlibrary
diff --git a/caltechdata_api/__init__.py b/caltechdata_api/__init__.py
Lines changed: 3 additions & 5 deletions
diff --git a/caltechdata_api/caltechdata_edit.py b/caltechdata_api/caltechdata_edit.py
Lines changed: 5 additions & 3 deletions
diff --git a/caltechdata_api/caltechdata_write.py b/caltechdata_api/caltechdata_write.py
Lines changed: 5 additions & 2 deletions
diff --git a/caltechdata_api/customize_schema.py b/caltechdata_api/customize_schema.py
Lines changed: 122 additions & 36 deletions
@@ -1,8 +1,6 @@
-from .caltechdata_write import caltechdata_write
-from .caltechdata_write import send_s3
-from .caltechdata_edit import caltechdata_add
-from .caltechdata_edit import caltechdata_edit
-from .caltechdata_edit import caltechdata_unembargo
+from .caltechdata_edit import (caltechdata_add, caltechdata_edit,
+                               caltechdata_unembargo)
+from .caltechdata_write import caltechdata_write, send_s3
 from .customize_schema import customize_schema
 from .decustomize_schema import decustomize_schema
 from .get_metadata import get_metadata
@@ -1,7 +1,9 @@
+import copy
+import json
+
 from requests import session
-import json, copy
-from caltechdata_api import customize_schema
-from caltechdata_api import send_s3
+
+from caltechdata_api import customize_schema, send_s3
 
 
 def caltechdata_unembargo(token, ids, production=False):
 
@@ -1,7 +1,10 @@
+import copy
+import json
+import os
+
 from requests import session
+
 from caltechdata_api import customize_schema
-import json, copy
-import os
 
 
 def send_s3(filepath, token, production=False):
 
@@ -1,19 +1,19 @@
-# Convert a DataCite 4 standard schema json record to the customized internal
+# Convert a DataCite 4 or 4.3 standard schema json record to the customized internal
 # schema used by TIND in CaltechDATA
-import json
 import argparse
+import json
 
 
-def customize_schema(json_record):
+def customize_schema(json_record, schema='4'):
+    """Dispatch a DataCite JSON record to the converter for a schema version.
+
+    Args:
+        json_record: DataCite metadata record; passed unchanged to the
+            selected converter.
+        schema: '4' (the default) selects customize_schema_4, '43' selects
+            customize_schema_43.
+
+    Returns:
+        Whatever the selected converter returns.
+
+    Raises:
+        ValueError: if schema is neither '4' nor '43'.
+    """
 
-    # Extract subjects to single string
-    if "subjects" in json_record:
-        subjects = json_record["subjects"]
-        subs = []
-        for s in subjects:
-            subs.append(s["subject"])
-        json_record["subjects"] = subs
+    if schema == '4':
+        return customize_schema_4(json_record)
+    elif schema == '43':
+        return customize_schema_43(json_record)
+    else:
+        raise ValueError(f'Error: schema {schema} not defined')
 
+def customize_schema_4(json_record):
     # Extract identifier and label as DOI
     if "identifier" in json_record:
         identifier = json_record["identifier"]["identifier"]
@@ -22,31 +22,6 @@ def customize_schema(json_record):
         del json_record["identifier"]
         # will delete other identifiers in file
 
-    # Extract description
-    if "descriptions" in json_record:
-        for d in json_record["descriptions"]:
-            d["descriptionValue"] = d["description"]
-            del d["description"]
-
-    # Extract title
-    if "titles" in json_record:
-        titles = json_record["titles"]
-        for t in titles:
-            if "titleType" not in t:
-                json_record["title"] = t["title"]
-        del json_record["titles"]
-
-    # Language - only translating english
-    if "language" in json_record:
-        if json_record["language"] == "en":
-            json_record["language"] = "eng"
-
-    # Change related identifier labels
-    if "relatedIdentifiers" in json_record:
-        for listing in json_record["relatedIdentifiers"]:
-            listing["relatedIdentifierRelation"] = listing.pop("relationType")
-            listing["relatedIdentifierScheme"] = listing.pop("relatedIdentifierType")
-
     # change author formatting
     # We're dropping URIs
     if "creators" in json_record:
@@ -102,6 +77,117 @@ def customize_schema(json_record):
             newc.append(new)
         json_record["contributors"] = newc
 
+
+def customize_schema_43(json_record):
+    """Convert the identifier and name sections of a DataCite 4.3 record.
+
+    The record is modified in place:
+
+    * "identifiers" is removed; an entry whose identifierType is 'DOI' is
+      stored under "doi" and every other entry is collected under
+      "alternativeIdentifiers" (only set when there is at least one).
+    * "creators" is replaced by "authors", whose entries carry authorName
+      and, when present in the input, authorAffiliation and
+      authorIdentifiers.
+    * "contributors" is rewritten with contributorName and, when present
+      in the input, contributorAffiliation, contributorIdentifiers,
+      contributorType and contributorEmail.
+
+    Args:
+        json_record: dict holding the record; mutated in place.
+
+    Returns:
+        The same json_record object, so that the customize_schema
+        dispatcher's ``return customize_schema_43(json_record)`` yields
+        the converted record.
+
+    Raises:
+        KeyError: if an identifier lacks "identifierType", or a creator,
+            contributor or affiliation entry lacks "name".
+    """
+    # Extract identifiers and label as DOI or alternativeIdentifiers
+    if "identifiers" in json_record:
+        alt = []
+        for identifier in json_record["identifiers"]:
+            if identifier['identifierType'] == 'DOI':
+                # NOTE(review): the whole identifier dict is stored here;
+                # confirm whether only the DOI string is wanted instead.
+                json_record["doi"] = identifier
+            else:
+                alt.append(identifier)
+        if alt:
+            json_record['alternativeIdentifiers'] = alt
+        # Remove the key that was actually tested and iterated above.
+        del json_record["identifiers"]
+
+    # change author formatting
+    # We're dropping URIs
+    if "creators" in json_record:
+        newa = []
+        for a in json_record["creators"]:
+            new = {}
+            if "affiliations" in a:
+                affiliation = []
+                for aff in a["affiliations"]:
+                    # Read from the affiliation entry, not from the creator.
+                    # NOTE(review): assumes each entry has "name" and an
+                    # optional "ROR" key - confirm against real input.
+                    name = {'affiliation': aff["name"]}
+                    if 'ROR' in aff:
+                        name['ROR'] = aff['ROR']
+                    affiliation.append(name)
+                # Set only when present, so a creator without affiliations
+                # neither fails nor inherits the previous creator's list.
+                new["authorAffiliation"] = affiliation
+            new["authorName"] = a["name"]
+            if "nameIdentifiers" in a:
+                new["authorIdentifiers"] = [
+                    {
+                        "authorIdentifier": n["nameIdentifier"],
+                        "authorIdentifierScheme": n["nameIdentifierScheme"],
+                    }
+                    for n in a["nameIdentifiers"]
+                ]
+            newa.append(new)
+        json_record["authors"] = newa
+        del json_record["creators"]
+
+    # strip creator URI
+    if "contributors" in json_record:
+        newc = []
+        for c in json_record["contributors"]:
+            new = {}
+            if "nameIdentifiers" in c:
+                new["contributorIdentifiers"] = [
+                    {
+                        "contributorIdentifier": n["nameIdentifier"],
+                        "contributorIdentifierScheme": n["nameIdentifierScheme"],
+                    }
+                    for n in c["nameIdentifiers"]
+                ]
+            # Use the contributor being processed (c), not a variable left
+            # over from the creators loop.
+            if "affiliations" in c:
+                affiliation = []
+                for aff in c["affiliations"]:
+                    name = {'affiliation': aff["name"]}
+                    if 'ROR' in aff:
+                        name['ROR'] = aff['ROR']
+                    affiliation.append(name)
+                new["contributorAffiliation"] = affiliation
+            new["contributorName"] = c["name"]
+            if "contributorType" in c:
+                new["contributorType"] = c["contributorType"]
+            if "contributorEmail" in c:
+                new["contributorEmail"] = c["contributorEmail"]
+            newc.append(new)
+        json_record["contributors"] = newc
+
+    return json_record
+
+
+def customize_standard(json_record)
+
+    # Extract subjects to single string
+    if "subjects" in json_record:
+        subjects = json_record["subjects"]
+        subs = []
+        for s in subjects:
+            subs.append(s["subject"])
+        json_record["subjects"] = subs
+
+    # Extract description
+    if "descriptions" in json_record:
+        for d in json_record["descriptions"]:
+            d["descriptionValue"] = d["description"]
+            del d["description"]
+
+    # Extract title
+    if "titles" in json_record:
+        titles = json_record["titles"]
+        for t in titles:
+            if "titleType" not in t:
+                json_record["title"] = t["title"]
+        del json_record["titles"]
+
+    # Language - only translating english
+    if "language" in json_record:
+        if json_record["language"] == "en":
+            json_record["language"] = "eng"
+
+    # Change related identifier labels
+    if "relatedIdentifiers" in json_record:
+        for listing in json_record["relatedIdentifiers"]:
+            listing["relatedIdentifierRelation"] = listing.pop("relationType")
+            listing["relatedIdentifierScheme"] = listing.pop("relatedIdentifierType")
+
     # format
     if "formats" in json_record:
         json_record["format"] = json_record.pop("formats")
@@ -177,7 +263,7 @@ def customize_schema(json_record):
     # Read in from file for demo purposes
 
     parser = argparse.ArgumentParser(
-        description="customize_schema converts a DataCite 4 standard json record\
+        description="customize_schema converts a DataCite 4 or 4.3 standard json record\
                 to TIND customized internal schema in CaltechDATA"
     )
     parser.add_argument("json_files", nargs="+", help="json file name")