caltechlibrary
diff --git a/caltechdata_api/caltechdata_edit.py b/caltechdata_api/caltechdata_edit.py
Lines changed: 31 additions & 36 deletions
diff --git a/caltechdata_api/caltechdata_write.py b/caltechdata_api/caltechdata_write.py
Lines changed: 53 additions & 51 deletions
@@ -1,25 +1,23 @@
 from requests import session
-import json,copy
+import json, copy
 from caltechdata_api import customize_schema
 from caltechdata_api import send_s3
 
-def caltechdata_edit(token,ids,metadata={},files={},delete={},production=False):
-    '''Including files will only replaces files if they have the same name
+
+def caltechdata_edit(token, ids, metadata={}, files={}, delete={}, production=False):
+    """Including files will only replaces files if they have the same name
     The delete option will delete any existing files with a given file extension
-    There are more file operations that could be implemented'''
+    There are more file operations that could be implemented"""
 
-    #If files is a string - change to single value array
+    # If files is a string - change to single value array
     if isinstance(files, str) == True:
         files = [files]
     if isinstance(ids, int):
         ids = [str(ids)]
     if isinstance(ids, str):
         ids = [ids]
 
-    headers = {
-        'Authorization' : 'Bearer %s' % token,
-        'Content-type': 'application/json'
-    }
+    headers = {"Authorization": "Bearer %s" % token, "Content-type": "application/json"}
 
     if production == True:
         url = "https://data.caltech.edu/submit/api/edit/"
@@ -32,7 +30,7 @@ def caltechdata_edit(token,ids,metadata={},files={},delete={},production=False):
         metadata = customize_schema.customize_schema(copy.deepcopy(metadata))
 
     for idv in ids:
-        metadata['id'] = idv
+        metadata["id"] = idv
 
         if files:
             # Files to delete
@@ -41,79 +39,76 @@ def caltechdata_edit(token,ids,metadata={},files={},delete={},production=False):
             existing = c.get(api_url + idv)
             file_info = existing.json()["metadata"]
             fids = []
-            for f in files: #Check if new files match existing
-                if 'electronic_location_and_access' in file_info:
+            for f in files:  # Check if new files match existing
+                if "electronic_location_and_access" in file_info:
                     for ex in file_info["electronic_location_and_access"]:
-                        name = ex['electronic_name'][0]
-                        fu = ex['uniform_resource_identifier'].split('/')[-2]
+                        name = ex["electronic_name"][0]
+                        fu = ex["uniform_resource_identifier"].split("/")[-2]
                         if name == f:
                             fids.append(fu)
                         for d in delete:
                             if name == d:
                                 fids.append(fu)
-                            if name.split('.')[-1] == d:
+                            if name.split(".")[-1] == d:
                                 fids.append(fu)
             if len(fids) > 0:
-                fjson = {'delete': fids}
+                fjson = {"delete": fids}
 
             # upload new
             print(files)
             fileinfo = [send_s3(f, token, production) for f in files]
 
-            fjson['new'] = fileinfo
-            metadata['files'] = fjson
+            fjson["new"] = fileinfo
+            metadata["files"] = fjson
 
-        dat = json.dumps({'record': metadata})
+        dat = json.dumps({"record": metadata})
 
-        #outf = open('out.json','w')
-        #outf.write(dat)
+        # outf = open('out.json','w')
+        # outf.write(dat)
 
         c = session()
         response = c.post(url, headers=headers, data=dat)
         print(response.text)
 
-def caltechdata_add(token,ids,metadata={},files={},production=False):
-    '''Adds file'''
 
-    #If files is a string - change to single value array
+def caltechdata_add(token, ids, metadata={}, files={}, production=False):
+    """Adds file"""
+
+    # If files is a string - change to single value array
     if isinstance(ids, int):
         ids = [str(ids)]
     if isinstance(ids, str):
         ids = [ids]
 
     if production == True:
         url = "https://data.caltech.edu/submit/api/edit/"
-        api_url = "https://data.caltech.edu/api/record/"    
+        api_url = "https://data.caltech.edu/api/record/"
     else:
         url = "https://cd-sandbox.tind.io/submit/api/edit/"
         api_url = "https://cd-sandbox.tind.io/api/record/"
 
-    headers = {
-        'Authorization' : 'Bearer %s' % token,
-        'Content-type': 'application/json'
-    }
+    headers = {"Authorization": "Bearer %s" % token, "Content-type": "application/json"}
 
     if metadata:
         metadata = customize_schema.customize_schema(copy.deepcopy(metadata))
 
     fjson = {}
 
     for idv in ids:
-        metadata['id'] = idv
+        metadata["id"] = idv
 
         if files:
             # upload new
             fileinfo = [send_s3(f, token, production) for f in files]
 
-            fjson['new'] = fileinfo
-            metadata['files'] = fjson
+            fjson["new"] = fileinfo
+            metadata["files"] = fjson
 
-        dat = json.dumps({'record': metadata})
+        dat = json.dumps({"record": metadata})
 
-        #outf = open('out.json','w')
-        #outf.write(dat)
+        # outf = open('out.json','w')
+        # outf.write(dat)
 
         c = session()
         response = c.post(url, headers=headers, data=dat)
         return response.text
-
@@ -3,74 +3,78 @@
 import json, copy
 import os
 
-def send_s3(filepath,token,production=False):
-    
+
+def send_s3(filepath, token, production=False):
+
     if production == True:
         s3surl = "https://data.caltech.edu/tindfiles/sign_s3/"
         chkurl = "https://data.caltech.edu/tindfiles/md5_s3"
     else:
         s3surl = "https://cd-sandbox.tind.io/tindfiles/sign_s3/"
         chkurl = "https://cd-sandbox.tind.io/tindfiles/md5_s3"
 
-    headers = { 'Authorization' : 'Bearer %s' % token }
+    headers = {"Authorization": "Bearer %s" % token}
 
     c = session()
 
     print(s3surl)
     print(headers)
-    response = c.get(s3surl,headers=headers)
+    response = c.get(s3surl, headers=headers)
     jresp = response.json()
-    data = jresp['data']
-
-    bucket = jresp['bucket']
-    key = data['fields']['key']
-    policy = data['fields']['policy']
-    aid = data['fields']['AWSAccessKeyId']
-    signature = data['fields']['signature']
-    url = data['url']
-
-    infile = open(filepath,'rb')
-    size = infile.seek(0,2)
-    infile.seek(0,0) #reset at beginning
-
-    s3headers = { 'Host' : bucket+'.s3.amazonaws.com',\
-            'Date' : 'date',\
-            'x-amz-acl' : 'public-read',\
-            'Access-Control-Allow-Origin' : '*' }
-
-    form = ( ( 'key', key )
-            , ("acl", "public-read")
-            , ('AWSAccessKeyID', aid)
-            , ('policy', policy)
-            , ('signature', signature)
-            , ('file', infile ))
+    data = jresp["data"]
+
+    bucket = jresp["bucket"]
+    key = data["fields"]["key"]
+    policy = data["fields"]["policy"]
+    aid = data["fields"]["AWSAccessKeyId"]
+    signature = data["fields"]["signature"]
+    url = data["url"]
+
+    infile = open(filepath, "rb")
+    size = infile.seek(0, 2)
+    infile.seek(0, 0)  # reset at beginning
+
+    s3headers = {
+        "Host": bucket + ".s3.amazonaws.com",
+        "Date": "date",
+        "x-amz-acl": "public-read",
+        "Access-Control-Allow-Origin": "*",
+    }
+
+    form = (
+        ("key", key),
+        ("acl", "public-read"),
+        ("AWSAccessKeyID", aid),
+        ("policy", policy),
+        ("signature", signature),
+        ("file", infile),
+    )
 
     c = session()
-    response = c.post(url,files=form, headers=s3headers)
+    response = c.post(url, files=form, headers=s3headers)
     print(response)
-    if(response.text):
+    if response.text:
         raise Exception(response.text)
 
-    print(chkurl+'/'+bucket+'/'+key+'/')
+    print(chkurl + "/" + bucket + "/" + key + "/")
     print(headers)
-    response = c.get(chkurl+'/'+bucket+'/'+key+'/',headers=headers)
+    response = c.get(chkurl + "/" + bucket + "/" + key + "/", headers=headers)
     print(response)
     md5 = response.json()["md5"]
-    filename = filepath.split('/')[-1]
+    filename = filepath.split("/")[-1]
+
+    fileinfo = {"url": key, "filename": filename, "md5": md5, "size": size}
 
-    fileinfo = { "url" : key,\
-            "filename" : filename,\
-            "md5" : md5,"size" : size }
+    return fileinfo
 
-    return(fileinfo)
 
-def caltechdata_write(metadata,token,files=[],production=False):
+def caltechdata_write(metadata, token, files=[], production=False):
 
-    #If files is a string - change to single value array
+    # If files is a string - change to single value array
     if isinstance(files, str) == True:
         files = [files]
 
-    fileinfo=[]
+    fileinfo = []
 
     for f in files:
         fileinfo.append(send_s3(f, token, production))
@@ -80,20 +84,18 @@ def caltechdata_write(metadata,token,files=[],production=False):
     else:
         url = "https://cd-sandbox.tind.io/submit/api/create/"
 
-    headers = {
-        'Authorization' : 'Bearer %s' % token,
-        'Content-type': 'application/json'
-    }
+    headers = {"Authorization": "Bearer %s" % token, "Content-type": "application/json"}
 
     newdata = customize_schema.customize_schema(copy.deepcopy(metadata))
-    newdata['files'] = fileinfo
-    if 'doi' not in newdata:
-        #We want tind to generate the identifier
-        newdata['final_actions'] = [{"type":"create_doi",\
-                "parameters":{"type":"records","field":"doi"}}]
+    newdata["files"] = fileinfo
+    if "doi" not in newdata:
+        # We want tind to generate the identifier
+        newdata["final_actions"] = [
+            {"type": "create_doi", "parameters": {"type": "records", "field": "doi"}}
+        ]
 
-    dat = json.dumps({'record': newdata})
+    dat = json.dumps({"record": newdata})
 
     c = session()
-    response = c.post(url,headers=headers,data=dat)
+    response = c.post(url, headers=headers, data=dat)
     return response.text