forked from ehanson8/dspace-editing
-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathcreateGrosmanItemMetadataFromCSV.py
86 lines (75 loc) · 3.46 KB
/
createGrosmanItemMetadataFromCSV.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
# -*- coding: utf-8 -*-
import json
import csv
def createMetadataElementCSV(key, valueSource, lang):
    """Append one metadata element built from a single CSV column.

    Reads ``row[valueSource]`` from the module-level ``row`` (the CSV row
    currently being processed), strips surrounding whitespace, and appends
    an element dict to the module-level ``metadata`` list. Nothing is
    appended when the cell is missing, empty, or whitespace-only.

    Args:
        key: Metadata field name stored under ``'key'``.
        valueSource: Name of the CSV column to read.
        lang: Language code stored under ``'language'``; pass ``''`` to
            leave the ``'language'`` entry out of the element.

    Raises:
        KeyError: If ``valueSource`` is not a column of ``row``.
    """
    value = row[valueSource]
    # csv.DictReader fills the cells missing from a short row with None.
    if value is None:
        return
    value = value.strip()
    if not value:
        return
    # '/' in an issued date is rewritten to '--'. This is done before the
    # language check so the rewrite applies whether or not a language is
    # given, and so no empty 'language' entry is ever emitted.
    if key == 'dc.date.issued':
        value = value.replace('/', '--')
    metadataElement = {'key': key}
    if lang != '':
        metadataElement['language'] = lang
    metadataElement['value'] = value
    metadata.append(metadataElement)
def createMetadataElementCSVSplitField(key, valueSource, lang):
    """Append one metadata element per ``|``-separated value of a CSV column.

    Reads ``row[valueSource]`` from the module-level ``row`` (the CSV row
    currently being processed), splits it on ``'|'``, and appends one
    element dict per non-empty piece to the module-level ``metadata`` list.
    Each piece is stripped of surrounding whitespace, matching what
    ``createMetadataElementCSV`` does for single values; pieces that are
    empty after stripping (e.g. from ``'a||b'`` or a trailing ``'|'``) are
    skipped.

    Args:
        key: Metadata field name stored under ``'key'``.
        valueSource: Name of the CSV column to read.
        lang: Language code stored under ``'language'``; pass ``''`` to
            leave the ``'language'`` entry out of each element.

    Raises:
        KeyError: If ``valueSource`` is not a column of ``row``.
    """
    cell = row[valueSource]
    # csv.DictReader fills the cells missing from a short row with None.
    if cell is None:
        return
    # str.split returns the whole string as a single piece when there is
    # no '|', so single-valued cells need no separate code path.
    for piece in cell.split('|'):
        value = piece.strip()
        if not value:
            continue
        metadataElement = {'key': key}
        if lang != '':
            metadataElement['language'] = lang
        metadataElement['value'] = value
        metadata.append(metadataElement)
def createMetadataElementDirect(key, value, lang):
    """Append an element with a caller-supplied value to ``metadata``.

    Unlike the CSV-backed helpers, the value is taken from the argument
    rather than looked up in the current row. The element is appended to
    the module-level ``metadata`` list.

    Args:
        key: Metadata field name stored under ``'key'``.
        value: Value stored under ``'value'``, used as given.
        lang: Language code stored under ``'language'``; when it equals
            ``''`` the element has no ``'language'`` entry.
    """
    if lang == '':
        entry = {'key': key, 'value': value}
    else:
        entry = {'key': key, 'language': lang, 'value': value}
    metadata.append(entry)
# Convert a CSV of item descriptions into 'sample_metadata.json': one
# {'metadata': [...]} item per CSV row, collected into a single JSON list.
fileName = input('Enter fileName (including \'.csv\'): ')
# newline='' lets the csv module handle line endings itself, so newlines
# embedded in quoted fields are parsed correctly.
with open(fileName, newline='') as csvfile:
    reader = csv.DictReader(csvfile)
    counter = 0
    metadataGroup = []
    # `row` and `metadata` must stay module-level names: the
    # createMetadataElement* helpers read and append to them as globals.
    for row in reader:
        metadata = []
        createMetadataElementCSV('fileIdentifier', 'identifier', '')
        createMetadataElementCSVSplitField('dc.contributor.other', 'dc.contributor.other', '')
        createMetadataElementCSV('dc.date.issued', 'dc.date.issued', '')
        createMetadataElementCSVSplitField('dc.description', 'dc.description', 'en_US')
        createMetadataElementCSVSplitField('dc.description.statementofresponsibility', 'dc.description.statementofresponsibility', 'en_US')
        createMetadataElementCSV('dc.format.extent', 'dc.format.extent', '')
        # Every item gets the same fixed mimetype rather than a CSV value.
        createMetadataElementDirect('dc.format.mimetype', 'image/tiff', 'en_US')
        createMetadataElementCSV('dc.format.medium', 'dc.format.medium', 'en_US')
        createMetadataElementCSV('dc.publisher', 'dc.publisher', 'en_US')
        createMetadataElementCSVSplitField('dcterms.rights', 'dcterms.rights', '')
        createMetadataElementCSVSplitField('dc.subject.other', 'dc.subject.other', 'en_US')
        createMetadataElementCSV('dc.title', 'dc.title', '')
        createMetadataElementCSV('dc.type', 'dc.type', 'en_US')
        createMetadataElementCSVSplitField('dc.title.alternative', 'dc.title.alternative', '')
        createMetadataElementCSV('dcterms.accessRights', 'dcterms.accessRights', 'en_US')
        # Progress output: element count for this row, then rows done so far.
        print(len(metadata))
        item = {'metadata': metadata}
        metadataGroup.append(item)
        counter = counter + 1
        print(counter)
# The context manager guarantees the JSON is flushed and the handle closed
# instead of leaving that to interpreter shutdown.
with open('sample_metadata.json', 'w') as f:
    json.dump(metadataGroup, f)