Skip to content

Commit 8686606

Browse files
author
ehanson8
committed
updates
1 parent 24c232d commit 8686606

File tree

2 files changed

+37
-13
lines changed

2 files changed

+37
-13
lines changed

getTopContainerCountByResource.py

Lines changed: 26 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -19,18 +19,25 @@
1919
ids = requests.get(baseURL + endpoint, headers=headers).json()
2020

2121
f=csv.writer(open('topContainerCountByResource.csv', 'wb'))
22-
f.writerow(['title']+['uri']+['id_0']+['id_1']+['id_2']+['id_3']+['tcCount'])
22+
f.writerow(['title']+['uri']+['id_0']+['id_1']+['id_2']+['id_3']+['topContainerCount'])
2323

2424
f2=csv.writer(open('topContainersLinks.csv', 'wb'))
2525
f2.writerow(['resourceUri']+['topContainerUri'])
2626

27+
f3=csv.writer(open('uniqueTopContainers.csv', 'wb'))
28+
f3.writerow(['topContainer']+['indicator']+['barcode'])
29+
30+
31+
total = len(ids)
2732
topContainerLinks = []
2833
uniqueTopContainers = []
2934
for id in ids:
30-
print 'id', id
35+
36+
resourceTopContainers = []
37+
print 'id', id, total, 'records remaining'
38+
total = total - 1
3139
endpoint = '/repositories/3/resources/'+str(id)
3240
output = requests.get(baseURL + endpoint, headers=headers).json()
33-
topContainers =[]
3441
title = output['title'].encode('utf-8')
3542
uri = output['uri']
3643
id0 = output['id_0']
@@ -46,24 +53,23 @@
4653
id3 = output['id_3']
4754
except:
4855
id3=''
49-
searchEndpoint = '/repositories/3/top_containers/search'
50-
output = requests.get(baseURL + searchEndpoint, headers=headers).json()
56+
# ###searchEndpoint = '/repositories/3/top_containers/search'
57+
# ###output = requests.get(baseURL + searchEndpoint, headers=headers).json()
5158
page = 1
5259
payload = {'page': page, 'page_size': '3000', 'root_record': endpoint}
5360
search = requests.get(baseURL+'/search', headers=headers, params=payload).json()
5461
results = []
5562
resultsPage = search['results']
5663
for result in resultsPage:
5764
results.append(result)
58-
5965
while resultsPage != []:
6066
page = page + 1
6167
payload = {'page': page, 'page_size': '3000', 'root_record': endpoint}
6268
search = requests.get(baseURL+'/search', headers=headers, params=payload).json()
6369
resultsPage = search['results']
6470
for result in resultsPage:
6571
results.append(result)
66-
resourceTopContainers = []
72+
6773
for result in results:
6874
try:
6975
topContainers = result['top_container_uri_u_sstr']
@@ -72,22 +78,30 @@
7278
resourceTopContainers.append(topContainer)
7379
if topContainer not in uniqueTopContainers:
7480
uniqueTopContainers.append(topContainer)
75-
topContainerLink = str(id) +'|'+topContainer
81+
topContainerLink = str(id)+'|'+topContainer
7682
if topContainerLink not in topContainerLinks:
7783
topContainerLinks.append(topContainerLink)
7884
except:
79-
topContainer = ''
85+
topContainers = []
8086
topContainerCount = len(resourceTopContainers)
8187
print 'top containers', topContainerCount
8288
f.writerow([title]+[uri]+[id0]+[id1]+[id2]+[id3]+[topContainerCount])
8389

8490
for topContainerLink in topContainerLinks:
8591
f2.writerow([topContainerLink[:topContainerLink.index('|')]]+[topContainerLink[topContainerLink.index('|')+1:]])
8692

87-
f3=csv.writer(open('uniqueTopContainers.csv', 'wb'))
88-
f3.writerow(['topContainer'])
8993
for topContainer in uniqueTopContainers:
90-
f3.writerow([topContainer])
94+
search = requests.get(baseURL+topContainer, headers=headers).json()
95+
try:
96+
indicator = search['indicator']
97+
except:
98+
indicator = ''
99+
100+
try:
101+
barcode = search['barcode']
102+
except:
103+
barcode = ''
104+
f3.writerow([topContainer]+[indicator]+[barcode])
91105

92106
elapsedTime = time.time() - startTime
93107
m, s = divmod(elapsedTime, 60)

getTopContainerCountByResourceNoAOs.py

Lines changed: 11 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -71,7 +71,17 @@
7171
f3=csv.writer(open('uniqueTopContainersNoAOs.csv', 'wb'))
7272
f3.writerow(['topContainer'])
7373
for topContainer in uniqueTopContainers:
74-
f3.writerow([topContainer])
74+
search = requests.get(baseURL+topContainer, headers=headers).json()
75+
try:
76+
indicator = search['indicator']
77+
except:
78+
indicator = ''
79+
80+
try:
81+
barcode = search['barcode']
82+
except:
83+
barcode = ''
84+
f3.writerow([topContainer]+[indicator]+[barcode])
7585

7686
elapsedTime = time.time() - startTime
7787
m, s = divmod(elapsedTime, 60)

0 commit comments

Comments
 (0)