stash-wrapper 0.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,322 @@
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <xs:schema targetNamespace="http://dash.cdlib.org/stash_wrapper/"
3
+ xmlns="http://dash.cdlib.org/stash_wrapper/"
4
+ xmlns:xs="http://www.w3.org/2001/XMLSchema"
5
+ xmlns:vc="http://www.w3.org/2007/XMLSchema-versioning/XMLSchema-versioning.xsd" elementFormDefault="qualified"
6
+ attributeFormDefault="unqualified" vc:minVersion="1.0" vc:maxVersion="1.1">
7
+
8
+ <xs:annotation>
9
+ <xs:documentation xml:lang="en">
10
+ Stash wrapper schema, version 1.0
11
+ Copyright 2015 The Regents of the University of California
12
+ This document is available under the terms of the Creative Commons Attribution
13
+ 4.0 International (CC-BY) license, https://creativecommons.org/licenses/by/4.0/.
14
+ This schema wraps specific Stash administrative properties needed for the
15
+ Stash discovery environment that cannot be assumed to be available via the
16
+ configured descriptive schema, and that descriptive schema.
17
+ </xs:documentation>
18
+ </xs:annotation>
19
+
20
+ <xs:element name="stash_wrapper" type="stash_wrapper_type">
21
+ <xs:annotation>
22
+ <xs:documentation xml:lang="en">Stash wrapper parent element</xs:documentation>
23
+ </xs:annotation>
24
+ </xs:element>
25
+
26
+ <xs:complexType name="stash_wrapper_type">
27
+ <xs:sequence>
28
+ <xs:element name="identifier" type="identifier_type" minOccurs="1"
29
+ maxOccurs="1">
30
+ <xs:annotation>
31
+ <xs:documentation xml:lang="en">
32
+ Typed dataset identifier. Identifier types are drawn from the
33
+ DataCite schema list.
34
+ </xs:documentation>
35
+ </xs:annotation>
36
+ </xs:element>
37
+
38
+ <xs:element name="stash_administrative" type="stash_administrative_type"
39
+ minOccurs="1" maxOccurs="1">
40
+ <xs:annotation>
41
+ <xs:documentation xml:lang="en">
42
+ Stash administrative metadata wrapper.
43
+ </xs:documentation>
44
+ </xs:annotation>
45
+ </xs:element>
46
+
47
+ <xs:element name="stash_descriptive" type="stash_descriptive_type" minOccurs="1"
48
+ maxOccurs="1">
49
+ <xs:annotation>
50
+ <xs:documentation xml:lang="en">
51
+ Stash descriptive metadata wrapper. It contains arbitrary
52
+ well-formed XML conforming to the configured native descriptive
53
+ schema.
54
+ </xs:documentation>
55
+ </xs:annotation>
56
+ </xs:element>
57
+ </xs:sequence>
58
+ </xs:complexType>
59
+
60
+ <xs:complexType name="identifier_type">
61
+ <xs:simpleContent>
62
+ <xs:extension base="xs:string">
63
+ <xs:attribute name="type">
64
+ <xs:annotation>
65
+ <xs:documentation xml:lang="en">
66
+ Identifier type, drawn from the list defined by the DataCite
67
+ schema.
68
+ </xs:documentation>
69
+ </xs:annotation>
70
+ <xs:simpleType>
71
+ <xs:restriction base="xs:string">
72
+ <xs:enumeration value="ARK"/>
73
+ <xs:enumeration value="DOI"/>
74
+ <xs:enumeration value="Handle"/>
75
+ <xs:enumeration value="URL"/>
76
+ </xs:restriction>
77
+ </xs:simpleType>
78
+ </xs:attribute>
79
+ </xs:extension>
80
+ </xs:simpleContent>
81
+ </xs:complexType>
82
+
83
+ <xs:complexType name="stash_administrative_type">
84
+ <xs:annotation>
85
+ <xs:documentation xml:lang="en">
86
+ Stash administrative metadata wrapper type.
87
+ </xs:documentation>
88
+ </xs:annotation>
89
+ <xs:sequence>
90
+ <xs:element name="version" type="version_type" minOccurs="1" maxOccurs="1">
91
+ <xs:annotation>
92
+ <xs:documentation xml:lang="en">
93
+ Dataset version.
94
+ </xs:documentation>
95
+ </xs:annotation>
96
+ </xs:element>
97
+ <xs:element name="license" type="license_type" minOccurs="1" maxOccurs="1">
98
+ <xs:annotation>
99
+ <xs:documentation xml:lang="en">
100
+ Dataset license.
101
+ </xs:documentation>
102
+ </xs:annotation>
103
+ </xs:element>
104
+ <xs:element name="embargo" type="embargo_type" minOccurs="1" maxOccurs="1">
105
+ <xs:annotation>
106
+ <xs:documentation xml:lang="en">
107
+ Dataset embargo.
108
+ </xs:documentation>
109
+ </xs:annotation>
110
+ </xs:element>
111
+ <xs:element name="inventory" type="inventory_type" minOccurs="0" maxOccurs="1">
112
+ <xs:annotation>
113
+ <xs:documentation xml:lang="en">
114
+ File inventory of the dataset submission package.
115
+ </xs:documentation>
116
+ </xs:annotation>
117
+ </xs:element>
118
+ </xs:sequence>
119
+ </xs:complexType>
120
+
121
+ <xs:complexType name="version_type">
122
+ <xs:annotation>
123
+ <xs:documentation xml:lang="en">
124
+ Dataset version type.
125
+ </xs:documentation>
126
+ </xs:annotation>
127
+ <xs:sequence>
128
+ <xs:element name="version_number" type="xs:positiveInteger" minOccurs="1"
129
+ maxOccurs="1">
130
+ <xs:annotation>
131
+ <xs:documentation xml:lang="en">
132
+ Dataset version number.
133
+ </xs:documentation>
134
+ </xs:annotation>
135
+ </xs:element>
136
+ <xs:element name="date" type="xs:date" minOccurs="1" maxOccurs="1">
137
+ <xs:annotation>
138
+ <xs:documentation xml:lang="en">
139
+ Dataset version date, YYYY-MM-DD.
140
+ </xs:documentation>
141
+ </xs:annotation>
142
+ </xs:element>
143
+ <xs:element name="note" type="xs:string" minOccurs="0" maxOccurs="1">
144
+ <xs:annotation>
145
+ <xs:documentation xml:lang="en">
146
+ Optional dataset version note describing the conditions leading
147
+ to the creation of this version.
148
+ </xs:documentation>
149
+ </xs:annotation>
150
+ </xs:element>
151
+ </xs:sequence>
152
+ </xs:complexType>
153
+
154
+ <xs:complexType name="license_type">
155
+ <xs:annotation>
156
+ <xs:documentation xml:lang="en">
157
+ Dataset license type.
158
+ </xs:documentation>
159
+ </xs:annotation>
160
+ <xs:sequence>
161
+ <xs:element name="name" type="xs:string" minOccurs="1" maxOccurs="1">
162
+ <xs:annotation>
163
+ <xs:documentation xml:lang="en">
164
+ Dataset license name.
165
+ </xs:documentation>
166
+ </xs:annotation>
167
+ </xs:element>
168
+ <xs:element name="uri" type="xs:anyURI" minOccurs="1" maxOccurs="1">
169
+ <xs:annotation>
170
+ <xs:documentation xml:lang="en">
171
+ Dataset license URI.
172
+ </xs:documentation>
173
+ </xs:annotation>
174
+ </xs:element>
175
+ </xs:sequence>
176
+ </xs:complexType>
177
+
178
+ <xs:complexType name="embargo_type">
179
+ <xs:annotation>
180
+ <xs:documentation xml:lang="en">
181
+ Dataset embargo type.
182
+ </xs:documentation>
183
+ </xs:annotation>
184
+ <xs:sequence>
185
+ <xs:element name="type" type="embargo_type_type" minOccurs="1" maxOccurs="1">
186
+ <xs:annotation>
187
+ <xs:documentation xml:lang="en">
188
+ Dataset embargo type.
189
+ </xs:documentation>
190
+ </xs:annotation>
191
+ </xs:element>
192
+ <xs:element name="period" type="xs:string" minOccurs="1" maxOccurs="1">
193
+ <xs:annotation>
194
+ <xs:documentation xml:lang="en">
195
+ Dataset embargo period, i.e., a textual description of the
196
+ period, e.g., "6 months". If the embargo type is "none", this
197
+ value is ignored, but should be set to "none".
198
+ </xs:documentation>
199
+ </xs:annotation>
200
+ </xs:element>
201
+ <xs:element name="start" type="xs:date" minOccurs="1" maxOccurs="1">
202
+ <xs:annotation>
203
+ <xs:documentation xml:lang="en">
204
+ Dataset embargo start date. This should be set to the date
205
+ at which the embargo (and Stash wrapper instance document) is
206
+ created.
207
+ </xs:documentation>
208
+ </xs:annotation>
209
+ </xs:element>
210
+ <xs:element name="end" type="xs:date" minOccurs="1" maxOccurs="1">
211
+ <xs:annotation>
212
+ <xs:documentation xml:lang="en">
213
+ Dataset embargo end date. If the embargo type is "none", this
214
+ value is ignored, but should be set to the start date.
215
+ </xs:documentation>
216
+ </xs:annotation>
217
+ </xs:element>
218
+ </xs:sequence>
219
+ </xs:complexType>
220
+
221
+ <xs:simpleType name="embargo_type_type">
222
+ <xs:annotation>
223
+ <xs:documentation xml:lang="en">
224
+ Dataset embargo type: none, download, description.
225
+ </xs:documentation>
226
+ </xs:annotation>
227
+ <xs:restriction base="xs:string">
228
+ <xs:enumeration value="none"/>
229
+ <xs:enumeration value="download"/>
230
+ <xs:enumeration value="description"/>
231
+ </xs:restriction>
232
+ </xs:simpleType>
233
+
234
+ <xs:complexType name="inventory_type">
235
+ <xs:annotation>
236
+ <xs:documentation xml:lang="en">
237
+ Dataset file inventory type.
238
+ </xs:documentation>
239
+ </xs:annotation>
240
+ <xs:sequence>
241
+ <xs:element name="file" type="file_type" minOccurs="0" maxOccurs="unbounded">
242
+ <xs:annotation>
243
+ <xs:documentation xml:lang="en">
244
+ Dataset submission package file.
245
+ </xs:documentation>
246
+ </xs:annotation>
247
+ </xs:element>
248
+ </xs:sequence>
249
+ <xs:attribute name="num_files" type="xs:nonNegativeInteger">
250
+ <xs:annotation>
251
+ <xs:documentation xml:lang="en">
252
+ Number of files in the submission package inventory.
253
+ </xs:documentation>
254
+ </xs:annotation>
255
+ </xs:attribute>
256
+ </xs:complexType>
257
+
258
+ <xs:complexType name="file_type">
259
+ <xs:annotation>
260
+ <xs:documentation xml:lang="en">
261
+ Dataset inventory file type.
262
+ </xs:documentation>
263
+ </xs:annotation>
264
+ <xs:sequence>
265
+ <xs:element name="pathname" type="xs:string" minOccurs="1" maxOccurs="1">
266
+ <xs:annotation>
267
+ <xs:documentation xml:lang="en">
268
+ Dataset file pathname.
269
+ </xs:documentation>
270
+ </xs:annotation>
271
+ </xs:element>
272
+
273
+ <xs:element name="size" type="size_type" minOccurs="1" maxOccurs="1">
274
+ <xs:annotation>
275
+ <xs:documentation xml:lang="en">
276
+ Dataset file size, as an integer.
277
+ </xs:documentation>
278
+ </xs:annotation>
279
+ </xs:element>
280
+
281
+ <xs:element name="mime_type" type="xs:string" minOccurs="1" maxOccurs="1">
282
+ <xs:annotation>
283
+ <xs:documentation xml:lang="en">
284
+ Dataset file MIME type.
285
+ </xs:documentation>
286
+ </xs:annotation>
287
+ </xs:element>
288
+ </xs:sequence>
289
+ </xs:complexType>
290
+
291
+ <xs:complexType name="size_type">
292
+ <xs:annotation>
293
+ <xs:documentation xml:lang="en">
294
+ Dataset file size type.
295
+ </xs:documentation>
296
+ </xs:annotation>
297
+ <xs:simpleContent>
298
+ <xs:extension base="xs:nonNegativeInteger">
299
+ <xs:attribute name="unit">
300
+ <xs:simpleType>
301
+ <xs:restriction base="xs:string">
302
+ <xs:enumeration value="B"/>
303
+ </xs:restriction>
304
+ </xs:simpleType>
305
+ </xs:attribute>
306
+ </xs:extension>
307
+ </xs:simpleContent>
308
+ </xs:complexType>
309
+
310
+ <xs:complexType name="stash_descriptive_type">
311
+ <xs:annotation>
312
+ <xs:documentation xml:lang="en">
313
+ Stash descriptive metadata wrapper type. This contains arbitrary well-formed
314
+ XML conforming to the configured descriptive schema.
315
+ </xs:documentation>
316
+ </xs:annotation>
317
+ <xs:sequence>
318
+ <xs:any namespace="##any" processContents="lax" minOccurs="0"
319
+ maxOccurs="unbounded"/>
320
+ </xs:sequence>
321
+ </xs:complexType>
322
+ </xs:schema>
@@ -0,0 +1,56 @@
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <st:stash_wrapper xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
3
+ xsi:schemaLocation="http://dash.cdlib.org/stash_wrapper/ http://dash.cdlib.org/stash_wrapper/stash_wrapper.xsd"
4
+ xmlns:st="http://dash.cdlib.org/stash_wrapper/">
5
+ <st:identifier type="DOI">10.12345/1234567890</st:identifier>
6
+ <st:stash_administrative>
7
+ <st:version>
8
+ <st:version_number>1</st:version_number>
9
+ <st:date>2015-09-08</st:date>
10
+ </st:version>
11
+ <st:license>
12
+ <st:name>Creative Commons Attribution 4.0 International (CC-BY)</st:name>
13
+ <st:uri>https://creativecommons.org/licenses/by/4.0/legalcode</st:uri>
14
+ </st:license>
15
+ <st:embargo>
16
+ <st:type>download</st:type>
17
+ <st:period>6 months</st:period>
18
+ <st:start>2015-09-08</st:start>
19
+ <st:end>2016-03-07</st:end>
20
+ </st:embargo>
21
+ <st:inventory num_files="1">
22
+ <st:file>
23
+ <st:pathname>mydata.xlsx</st:pathname>
24
+ <st:size unit="B">12345678</st:size>
25
+ <st:mime_type>application/vnd.openxmlformats-officedocument.spreadsheetml.sheet</st:mime_type>
26
+ </st:file>
27
+ </st:inventory>
28
+ </st:stash_administrative>
29
+ <st:stash_descriptive>
30
+ <dcs:resource xmlns:dcs="http://datacite.org/schema/kernel-3"
31
+ xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
32
+ xsi:schemaLocation="http://datacite.org/schema/kernel-3
33
+ http://schema.datacite.org/meta/kernel-3/metadata.xsd">
34
+ <dcs:identifier identifierType="DOI">10.12345/1234567890</dcs:identifier>
35
+ <dcs:creators>
36
+ <dcs:creator>
37
+ <dcs:creatorName>Abrams, Stephen</dcs:creatorName>
38
+ </dcs:creator>
39
+ </dcs:creators>
40
+ <dcs:titles>
41
+ <dcs:title>My dataset</dcs:title>
42
+ </dcs:titles>
43
+ <dcs:publisher>UC Office of the President</dcs:publisher>
44
+ <dcs:publicationYear>2016</dcs:publicationYear>
45
+ <dcs:subjects>
46
+ <dcs:subject>Data literacy</dcs:subject>
47
+ </dcs:subjects>
48
+ <dcs:resourceType resourceTypeGeneral="Dataset">Spreadsheet</dcs:resourceType>
49
+ <dcs:descriptions>
50
+ <dcs:description descriptionType="Abstract">
51
+ Lorum ipsum.
52
+ </dcs:description>
53
+ </dcs:descriptions>
54
+ </dcs:resource>
55
+ </st:stash_descriptive>
56
+ </st:stash_wrapper>
@@ -0,0 +1,88 @@
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <resource xmlns='http://datacite.org/schema/kernel-3' xmlns:xsi='http://www.w3.org/2001/XMLSchema-instance'
3
+ xsi:schemaLocation='http://datacite.org/schema/kernel-3 http://schema.datacite.org/meta/kernel-3/metadata.xsd'>
4
+ <identifier identifierType='DOI'>10.14749/1407399498</identifier>
5
+ <creators>
6
+ <creator>
7
+ <creatorName>Zuma, Khangelani</creatorName>
8
+ </creator>
9
+ <creator>
10
+ <creatorName>Human Sciences Research Council</creatorName>
11
+ </creator>
12
+ </creators>
13
+ <titles>
14
+ <title xml:lang='en'>HSRC Master Sample II</title>
15
+ </titles>
16
+ <publisher>HSRC - Human Science Research Council SA</publisher>
17
+ <publicationYear>2014</publicationYear>
18
+ <contributors>
19
+ <contributor contributorType='Distributor'>
20
+ <contributorName>Human Sciences Research Council</contributorName>
21
+ </contributor>
22
+ <contributor contributorType='Funder'>
23
+ <contributorName>Human Sciences Research Council</contributorName>
24
+ </contributor>
25
+ <contributor contributorType='RightsHolder'>
26
+ <contributorName>Human Sciences Research Council</contributorName>
27
+ </contributor>
28
+ </contributors>
29
+ <language>eng</language>
30
+ <resourceType resourceTypeGeneral='Dataset'/>
31
+ <version>1.0</version>
32
+ <rightsList>
33
+ <rights>
34
+ By accessing the data, you give assurance that The data and documentation will not be duplicated, redistributed or sold without prior approval from
35
+ the rights holder. The data will be used for scientific research or educational purposes only. The data will only be used for the specified
36
+ purpose. If it is used for another purpose the additional purpose will be registered. Redundant data files will be destroyed. The confidentiality of
37
+ individuals/organisations in the data will be preserved at all times. No attempt will be made to obtain or derive information from the data to
38
+ identify individuals/organisations. The HSRC will be acknowledged in all published and unpublished works based on the data according to the provided
39
+ citation. The HSRC will be informed of any books, articles, conference papers, theses, dissertations, reports or other publications resulting from
40
+ work based in whole or in part on the data and documentation. For archiving and bibliographic purposes an electronic copy of all reports and
41
+ publications based on the requested data will be sent to the HSRC. To offer for deposit into the HSRC Data Collection any new data sets which have
42
+ been derived from or which have been created by the combination of the data supplied with other data. The data team bears no responsibility for use of
43
+ the data or for interpretations or inferences based upon such uses. Failure to comply with the End User License may result in sanctions being imposed.
44
+ </rights>
45
+ </rightsList>
46
+ <descriptions>
47
+ <description descriptionType='Abstract' xml:lang='en'>
48
+ &lt;p&gt; The 2005 HSRC Master Sample was used for SABSSM 2008 and 2012, the SANHANES study in 2012 and SASAS 2007-2010 (adjacent EAs) to obtain an
49
+ understanding of geographical spread of HIV/AIDS, perceptions and attitudes of people and other health related studies over time.&lt;/p&gt;
50
+ </description>
51
+ <description descriptionType='Abstract' xml:lang='en'>
52
+ &lt;p&gt; A sample can be defined as a subset containing the characteristics of a larger population. Samples are used in statistical testing when
53
+ population sizes are too large for the test to include all possible members or observations. A sample should represent the whole population and not
54
+ reflect bias toward a specific attribute.[1]&lt;/p&gt; &lt;p&gt; One of the most crucial aspects of sample design in household surveys is its
55
+ frame. The sampling frame has significant implications on the cost and the quality of any survey, household or otherwise.[2]&lt;/p&gt; &lt;p&gt; The
56
+ sampling frame .... in a household survey must cover the entire target population. When that frame is used for multiple surveys or multiple rounds of
57
+ the same survey it is known as a master sample frame or .... master sample.[3]&lt;/p&gt; &lt;p&gt; A master sample is a sample drawn from a population
58
+ for use on a number of future occasions, so as to avoid ad hoc sampling on each occasion. Sometimes the master sample is large and subsequent
59
+ inquiries are based on a sub-sample from it.[4]&lt;/p&gt; &lt;p&gt; The HSRC compiles master samples in order to construct samples for various HSRC
60
+ research studies. The 2005 HSRC Master Sample was used for SABSSM 2008 and 2012, SASAS 2007-2010 and the SANHANES study in 2012 to obtain an
61
+ understanding of geographical spread of HIV/AIDS, perceptions and attitudes of people and other health related studies over time.&lt;/p&gt; &lt;p&gt;
62
+ The 2005 HSRC Master Sample was created in the following way:&lt;/p&gt; &lt;p&gt; South Africa was delineated into EAs according to municipality and
63
+ province. Municipal boundaries were obtained from the Municipal Demarcation Board. An Enumeration area (EA) is the smallest geographical unit (piece
64
+ of land) into which the country is divided for census or survey enumeration.[5] The concepts and definitions of terms used for Census 2001 comply in
65
+ most instances with United Nations standards for censuses.&lt;/p&gt; &lt;p&gt; A total of 1,000 census enumeration areas (EAs) from the 2001
66
+ population census were randomly selected using probability proportional to size and stratified by province, locality type and race in urban areas from
67
+ a database of 80 787 EAs that were mapped using aerial photography to develop an HSRC master sample for selecting households.&lt;/p&gt; &lt;p&gt; The
68
+ ideal frame would be complete with respect to the target population if all of its members (the universe) are covered by the frame.&lt;/p&gt; &lt;p&gt;
69
+ Ideal characteristics of a master sample:&lt;/p&gt; &lt;ul&gt; &lt;li&gt; The master frame should be as complete, accurate and current as
70
+ practicable.&lt;/li&gt; &lt;li&gt; A master sample frame for household surveys is typically developed from the most recent census, just as a regular
71
+ sample frame is.&lt;/li&gt; &lt;li&gt; Because the master frame may be used during an entire intercensal (between census) period, however, it will
72
+ usually require periodic and regular updating such as every 2-3 years.&lt;/li&gt; &lt;li&gt; This is in contrast to a regular frame which is more
73
+ likely to be up-dated on an ad hoc basis and only when a particular survey is being planned[6]&lt;/li&gt; &lt;/ul&gt; &lt;p&gt; [1]
74
+ http://www.investopedia.com/terms/s/sample.asp&lt;/p&gt; &lt;p&gt; [2]
75
+ http://unstats.un.org/unsd/demographic/meetings/egm/sampling_1203/docs/no_3.pdf&lt;/p&gt; &lt;p&gt; [3]
76
+ http://unstats.un.org/unsd/demographic/meetings/egm/sampling_1203/docs/no_3.pdf&lt;/p&gt; &lt;p&gt; [4] A Dictionary of Statistical Terms, 5th
77
+ edition, prepared for the International Statistical Institute by F.H.C. Marriott. Published for the International Statistical Institute by Longman
78
+ Scientific and Technical. http://stats.oecd.org/glossary/detail.asp?ID=3708&lt;/p&gt; &lt;p&gt; [5]
79
+ http://africageodownloads.info/128_mokgokolo.pdf&lt;/p&gt; &lt;p&gt; [6]
80
+ http://unstats.un.org/unsd/demographic/meetings/egm/sampling_1203/docs/no_3.pdf&lt;/p&gt;
81
+ </description>
82
+ </descriptions>
83
+ <geoLocations>
84
+ <geoLocation>
85
+ <geoLocationPlace>National - all 9 provinces</geoLocationPlace>
86
+ </geoLocation>
87
+ </geoLocations>
88
+ </resource>