-
Notifications
You must be signed in to change notification settings - Fork 27
/
Copy pathexample.py
253 lines (228 loc) · 10.3 KB
/
example.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
# This software is licenced under the BSD 3-Clause licence
# available at https://opensource.org/licenses/BSD-3-Clause
# and described in the LICENCE file in the root of this project
"""
Example Python 3 application using the dspace.py API client library to create
some resources in a DSpace 7 repository.
"""
from pprint import pprint
import os
import sys
from dspace_rest_client.client import DSpaceClient
from dspace_rest_client.models import Community, Collection, Item, Bundle, Bitstream
DEFAULT_URL = 'http://localhost:8080/server/api'
DEFAULT_USERNAME = '[email protected]'
DEFAULT_PASSWORD = 'password'
# Configuration from environment variables
URL = os.environ.get('DSPACE_API_ENDPOINT', DEFAULT_URL)
USERNAME = os.environ.get('DSPACE_API_USERNAME', DEFAULT_USERNAME)
PASSWORD = os.environ.get('DSPACE_API_PASSWORD', DEFAULT_PASSWORD)
# Instantiate DSpace client
# Note the 'fake_user_agent' setting here -- this will set a string like the following,
# to get by Cloudfront:
# Mozilla/5.0 (Windows NT 6.2; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) \
# Chrome/39.0.2171.95 Safari/537.36
# The default is to *not* fake the user agent, and instead use the default of
# DSpace-Python-REST-Client/x.y.z
# To specify a custom user agent, set the USER_AGENT env variable and leave/set
# fake_user_agent as False
d = DSpaceClient(api_endpoint=URL, username=USERNAME, password=PASSWORD, fake_user_agent=True)
# Authenticate against the DSpace client
authenticated = d.authenticate()
if not authenticated:
print('Error logging in! Giving up.')
sys.exit(1)
# An example of searching for workflow items (any search configuration from discovery.xml can be used)
# note that the results here depend on the workflow role / access of the logged in user
search_results = d.search_objects(query='*:*', dso_type='item', configuration='workflow')
for result in search_results:
print(f'{result.name} ({result.uuid})')
# Put together some basic Community data.
# See https://github.com/DSpace/RestContract/blob/main/communities.md
community_data = {
'name': 'Community created by the Python REST Client',
'metadata': {
'dc.title': [
{'value': 'Community created by the Python REST Client',
'language': 'en', 'authority': None, 'confidence': -1
},
{'value': 'Vom Python-REST-Client erstellte Community',
'language': 'de', 'authority': None, 'confidence': -1
}
]
}
}
# Create the new community
# In this example, we'll just make this a top-level community by
# passing None as the parent parameter
COMMUNITY_PARENT = None
new_community = d.create_community(parent=COMMUNITY_PARENT, data=community_data)
if isinstance(new_community, Community) and new_community.uuid is not None:
print(f'New community created! Handle: {new_community.handle}')
else:
print('Error! Giving up.')
sys.exit(1)
# Update the community metadata
new_community.name = 'Community created by the Python REST Client - Updated Name'
new_community.metadata['dc.title'][0] = {
'value': 'Community created by the Python REST Client - Updated Name',
'language': 'en', 'authority': None, 'confidence': -1
}
# Linked resources can be embedded with responses, e.g.
updated_community = d.update_dso(new_community, embeds=['logo', 'collections'])
# Print logo (it'll be None in this case, but just an example
print(f"Logo for updated community is {updated_community.embedded['logo']}")
# Put together some basic Collection data.
# See https://github.com/DSpace/RestContract/blob/main/collections.md
collection_data = {
'name': 'Collection created by the Python REST Client',
'metadata': {
'dc.title': [
{'value': 'Collection created by the Python REST Client',
'language': 'en', 'authority': None, 'confidence': -1
},
{'value': 'Vom Python-REST-Client erstellte Sammlung',
'language': 'de', 'authority': None, 'confidence': -1
}
]
}
}
# Create the new collection
# In this example, we'll pass the new community UUID as our parent container
collection_parent = new_community.uuid
new_collection = d.create_collection(parent=collection_parent, data=collection_data)
if isinstance(new_collection, Collection) and new_collection.uuid is not None:
print(f'New collection created! Handle: {new_collection.handle}')
else:
print('Error! Giving up.')
sys.exit(1)
# Put together some basic Item data.
# (See: https://github.com/DSpace/RestContract/blob/main/items.md)
item_data = {
"name": "Test Item created by the Python REST Client",
"metadata": {
"dc.contributor.author": [
{
"value": "Shepherd, Kim",
"language": "en",
"authority": None,
"confidence": -1
}
],
"dc.title": [
{
"value": "Test Item created by the Python REST Client",
"language": "en",
"authority": None,
"confidence": -1
}
],
"dc.type": [
{
"value": "Journal Article",
"language": "en",
"authority": None,
"confidence": -1
}
]
},
"inArchive": True,
"discoverable": True,
"withdrawn": False,
"type": "item"
}
# The creation process for an item is a bit different, because they're typically a bit more
# complex than a container object. However, they're all DSOs at the end of the day so we
# could make usage fully consistent if we wanted.
#
# Instantiate an empty Item, passing the full API resource data to the constructor.
item = Item(item_data)
# Create the item using the new collection as the parent container.
# Note that we're passing the full Item object here, not just the dict data
# (though it will be serialised to a dict before the final POST)
new_item = d.create_item(parent=new_collection.uuid, item=item)
if isinstance(new_item, Item) and new_item.uuid is not None:
print(f'New item created! Handle: {new_item.handle}')
else:
print('Error! Giving up.')
sys.exit(1)
# Add a single metadata field+value to the item (PATCH operation)
updated_item = d.add_metadata(dso=new_item, field='dc.description.abstract',
value='Added abstract to an existing item',
language='en', authority=None, confidence=-1)
# Create a new ORIGINAL bundle
# See https://github.com/DSpace/RestContract/blob/main/bundles.md
new_bundle = d.create_bundle(parent=new_item, name='ORIGINAL')
if isinstance(new_bundle, Bundle) and new_bundle.uuid is not None:
print(f'New bundle created! UUID: {new_bundle.uuid}')
else:
print('Error! Giving up.')
sys.exit(1)
# Create and upload a new bitstream using the LICENSE.txt file in this project
# Set bitstream metadata
# See https://github.com/DSpace/RestContract/blob/main/bitstreams.md
bitstream_metadata = {
'dc.description':
[{"value": "Bitstream uploaded by Python REST Client", 'language': 'en',
'authority': None, 'confidence': -1, 'place': 0}]
}
# Set the mime type (using mimetypes.guess_type is recommended for real uploads if you
# don't want to set manually)
FILE_MIME = 'text/plain'
# Set a better file name for our test upload
FILE_NAME = 'uploaded_file.txt'
# Create the bitstream and upload the file
new_bitstream = d.create_bitstream(bundle=new_bundle, name=FILE_NAME,
path='LICENSE.txt', mime=FILE_MIME, metadata=bitstream_metadata)
if isinstance(new_bitstream, Bitstream) and new_bitstream.uuid is not None:
print(f'New bitstream created! UUID: {new_bitstream.uuid}')
else:
print('Error! Giving up.')
sys.exit(1)
print('All finished with example data creation. Visit your test repository to review \
created objects')
# Retrieving objects - now that we know there is some data in the repository we can demonstrate
# some simple ways of retrieving and iterating DSOs
print('\nBeginning examples of get, search methods\n')
# Get top communities
top_communities = d.get_communities(top=True)
for top_community in top_communities:
print(f'{top_community.name} ({top_community.uuid})')
# Get all collections in this community
collections = d.get_collections(community=top_community)
for collection in collections:
print(f'{collection.name} ({collection.uuid}')
# Get all items in this collection - see that the recommended method is a search,
# scoped to this collection
# (there is no collection/items endpoint, though there is a /mappedItems endpoint,
# not yet implemented here)
items = d.search_objects(query='*:*', scope=collection.uuid, dso_type='item', configuration='default')
for item in items:
print(f'{item.name} ({item.uuid})')
# Get all bundles in this item
bundles = d.get_bundles(parent=item)
for bundle in bundles:
print(f'{bundle.name} ({bundle.uuid}')
# Get all bitstreams in this bundle
bitstreams = d.get_bitstreams(bundle=bundle)
for bitstream in bitstreams:
print(f'{bitstream.name} ({bitstream.uuid}')
# Download this bitstream
r = d.download_bitstream(bitstream.uuid)
if r is not None and r.headers is not None:
print(
'\tHeaders (server info, not calculated locally)\n'
f'\tmd5: {r.headers.get("ETag")}\n'
f'\tformat: {r.headers.get("Content-Type")}\n'
f'\tlength: {r.headers.get("Content-Length")}\n'
f'\tLOCAL LEN(): {len(r.content)}'
)
# Uncomment the below to get the binary data in content and then do
# something with it like print, or write to file, etc. You want to use
# the 'content' property of the response object
#
# print(r.content)
# Finally, let's show the new _iter methods which will transparently handle pagination
# and return iterators which you can use as normal
for i, search_result in enumerate(d.search_objects_iter('*:*')):
print(f'Result #{i}: {search_result.name} ({search_result.uuid})')