new script

ehanson8 · ehanson8 · commit 0647444860a4 · 2018-10-10T15:38:49.000-04:00
diff --git a/README.md b/README.md
@@ -34,6 +34,9 @@ Retrieves a count of archival objects associated with a particular resource. Upo
 #### [getArchivalObjectsByResource.py](/getArchivalObjectsByResource.py)
 Extracts all of the archival objects associated with a particular resource. Upon running the script, you will be prompted to enter the resource ID (just the number, not the full URI).
 
+#### [getArchivalObjectRefIdsForResource.py](/getArchivalObjectRefIdsForResource.py)
+Extracts the title, URI, ref_id, and date expression for all archival objects associated with a particular resource. Upon running the script, you will be prompted to enter the resource ID (just the number, not the full URI).
+
 #### [getArrayPropertiesFromAgentsPeopleCSV.py](/getArrayPropertiesFromAgentsPeopleCSV.py)
 Retrieves specific properties, including properties that have arrays as values, from the JSON of ArchivesSpace agent_people records. In this example, the 'dates_of_existence' property contains an array that must be iterated over. This requires a second level of iteration with 'for j in range (...)' on line 20, which is in addition to the iteration function 'for i in range (...)' on line 19, which was also found in the getPropertiesFromAgentsPeopleCSV.py script. As with the previous script, it also writes the properties' values into a CSV file which is specified in variable 'f' on line 17.
 
diff --git a/getArchivalObjectRefIdsForResource.py b/getArchivalObjectRefIdsForResource.py
@@ -0,0 +1,57 @@
+import json
+import requests
+import secrets
+import time
+import csv
+
+# Start the clock so the total run time can be reported when the script ends.
+startTime = time.time()
+
+def findKey(d, key):
+    if key in d:
+        yield d[key]
+    for k in d:
+        if isinstance(d[k], list) and k == 'children':
+            for i in d[k]:
+                for j in findKey(i, key):
+                    yield j
+
+baseURL = secrets.baseURL
+user = secrets.user
+password = secrets.password
+
+auth = requests.post(baseURL + '/users/'+user+'/login?password='+password).json()
+session = auth["session"]
+headers = {'X-ArchivesSpace-Session':session, 'Content_Type':'application/json'}
+
+resourceID= raw_input('Enter resource ID: ')
+
+f=csv.writer(open('archivalObjectRefIdForResource.csv', 'wb'))
+f.writerow(['title']+['uri']+['ref_id']+['date'])
+
+endpoint = '/repositories/3/resources/'+resourceID+'/tree'
+
+output = requests.get(baseURL + endpoint, headers=headers).json()
+archivalObjects = []
+for value in findKey(output, 'record_uri'):
+    print value
+    if 'archival_objects' in value:
+        archivalObjects.append(value)
+
+print 'downloading aos'
+for archivalObject in archivalObjects:
+    output = requests.get(baseURL + archivalObject, headers=headers).json()
+    print output
+    title = output['title']
+    uri = output['uri']
+    ref_id = output['ref_id']
+    for date in output['dates']:
+        try:
+            date = date['expression']
+        except:
+            date = ''
+    f.writerow([title]+[uri]+[ref_id]+[date])
+
+elapsedTime = time.time() - startTime
+m, s = divmod(elapsedTime, 60)
+h, m = divmod(m, 60)
+print 'Total script run time: ', '%d:%02d:%02d' % (h, m, s)