stash-wrapper 0.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/.gitignore +46 -0
- data/.rubocop.yml +24 -0
- data/.ruby-version +1 -0
- data/.travis.yml +2 -0
- data/.yardopts +1 -0
- data/CHANGES.md +7 -0
- data/Gemfile +3 -0
- data/LICENSE.md +22 -0
- data/README.md +230 -0
- data/Rakefile +47 -0
- data/data/kernel3_to_oaidc.xsl +220 -0
- data/example.rb +52 -0
- data/lib/stash/wrapper.rb +6 -0
- data/lib/stash/wrapper/descriptive_node.rb +38 -0
- data/lib/stash/wrapper/embargo.rb +30 -0
- data/lib/stash/wrapper/embargo_type.rb +10 -0
- data/lib/stash/wrapper/identifier.rb +21 -0
- data/lib/stash/wrapper/identifier_type.rb +13 -0
- data/lib/stash/wrapper/inventory.rb +22 -0
- data/lib/stash/wrapper/license.rb +30 -0
- data/lib/stash/wrapper/module_info.rb +13 -0
- data/lib/stash/wrapper/size.rb +23 -0
- data/lib/stash/wrapper/size_unit.rb +11 -0
- data/lib/stash/wrapper/stash_administrative.rb +33 -0
- data/lib/stash/wrapper/stash_file.rb +57 -0
- data/lib/stash/wrapper/stash_wrapper.rb +130 -0
- data/lib/stash/wrapper/version.rb +24 -0
- data/spec/.rubocop.yml +7 -0
- data/spec/data/metadata.xsd +380 -0
- data/spec/data/wrapper/mrtoai-wrapper.xml +73 -0
- data/spec/data/wrapper/stash_wrapper.xsd +322 -0
- data/spec/data/wrapper/wrapper-1.xml +56 -0
- data/spec/data/wrapper/wrapper-2-payload.xml +88 -0
- data/spec/data/wrapper/wrapper-2.xml +164 -0
- data/spec/rspec_custom_matchers.rb +69 -0
- data/spec/spec_helper.rb +31 -0
- data/spec/unit/stash/wrapper/stash_wrapper_spec.rb +239 -0
- data/stash-wrapper.gemspec +39 -0
- metadata +245 -0
@@ -0,0 +1,322 @@
|
|
1
|
+
<?xml version="1.0" encoding="UTF-8"?>
|
2
|
+
<xs:schema targetNamespace="http://dash.cdlib.org/stash_wrapper/"
|
3
|
+
xmlns="http://dash.cdlib.org/stash_wrapper/"
|
4
|
+
xmlns:xs="http://www.w3.org/2001/XMLSchema"
|
5
|
+
xmlns:vc="http://www.w3.org/2007/XMLSchema-versioning/XMLSchema-versioning.xsd" elementFormDefault="qualified"
|
6
|
+
attributeFormDefault="unqualified" vc:minVersion="1.0" vc:maxVersion="1.1">
|
7
|
+
|
8
|
+
<xs:annotation>
|
9
|
+
<xs:documentation xml:lang="en">
|
10
|
+
Stash wrapper schema, version 1.0
|
11
|
+
Copyright 2015 The Regents of the University of California
|
12
|
+
This document is available under the terms of the Creative Commons Attribution
|
13
|
+
4.0 International (CC-BY) license, https://creativecommons.org/licenses/by/4.0/.
|
14
|
+
This schema wraps specific Stash administrative properties needed for the
|
15
|
+
Stash discovery environment that cannot be assumed to be available via the
|
16
|
+
configured descriptive schema, and that descriptive schema.
|
17
|
+
</xs:documentation>
|
18
|
+
</xs:annotation>
|
19
|
+
|
20
|
+
<xs:element name="stash_wrapper" type="stash_wrapper_type">
|
21
|
+
<xs:annotation>
|
22
|
+
<xs:documentation xml:lang="en">Stash wrapper parent element</xs:documentation>
|
23
|
+
</xs:annotation>
|
24
|
+
</xs:element>
|
25
|
+
|
26
|
+
<xs:complexType name="stash_wrapper_type">
|
27
|
+
<xs:sequence>
|
28
|
+
<xs:element name="identifier" type="identifier_type" minOccurs="1"
|
29
|
+
maxOccurs="1">
|
30
|
+
<xs:annotation>
|
31
|
+
<xs:documentation xml:lang="en">
|
32
|
+
Typed dataset identifier. Identifier types are drawn from the
|
33
|
+
DataCite schema list.
|
34
|
+
</xs:documentation>
|
35
|
+
</xs:annotation>
|
36
|
+
</xs:element>
|
37
|
+
|
38
|
+
<xs:element name="stash_administrative" type="stash_administrative_type"
|
39
|
+
minOccurs="1" maxOccurs="1">
|
40
|
+
<xs:annotation>
|
41
|
+
<xs:documentation xml:lang="en">
|
42
|
+
Stash administrative metadata wrapper.
|
43
|
+
</xs:documentation>
|
44
|
+
</xs:annotation>
|
45
|
+
</xs:element>
|
46
|
+
|
47
|
+
<xs:element name="stash_descriptive" type="stash_descriptive_type" minOccurs="1"
|
48
|
+
maxOccurs="1">
|
49
|
+
<xs:annotation>
|
50
|
+
<xs:documentation xml:lang="en">
|
51
|
+
Stash descriptive metadata wrapper. It contains arbitrary
|
52
|
+
well-formed XML conforming to the configured native descriptive
|
53
|
+
schema.
|
54
|
+
</xs:documentation>
|
55
|
+
</xs:annotation>
|
56
|
+
</xs:element>
|
57
|
+
</xs:sequence>
|
58
|
+
</xs:complexType>
|
59
|
+
|
60
|
+
<xs:complexType name="identifier_type">
|
61
|
+
<xs:simpleContent>
|
62
|
+
<xs:extension base="xs:string">
|
63
|
+
<xs:attribute name="type">
|
64
|
+
<xs:annotation>
|
65
|
+
<xs:documentation xml:lang="en">
|
66
|
+
Identifier type, drawn from the list defined by the DataCite
|
67
|
+
schema.
|
68
|
+
</xs:documentation>
|
69
|
+
</xs:annotation>
|
70
|
+
<xs:simpleType>
|
71
|
+
<xs:restriction base="xs:string">
|
72
|
+
<xs:enumeration value="ARK"/>
|
73
|
+
<xs:enumeration value="DOI"/>
|
74
|
+
<xs:enumeration value="Handle"/>
|
75
|
+
<xs:enumeration value="URL"/>
|
76
|
+
</xs:restriction>
|
77
|
+
</xs:simpleType>
|
78
|
+
</xs:attribute>
|
79
|
+
</xs:extension>
|
80
|
+
</xs:simpleContent>
|
81
|
+
</xs:complexType>
|
82
|
+
|
83
|
+
<xs:complexType name="stash_administrative_type">
|
84
|
+
<xs:annotation>
|
85
|
+
<xs:documentation xml:lang="en">
|
86
|
+
Stash administrative metadata wrapper type.
|
87
|
+
</xs:documentation>
|
88
|
+
</xs:annotation>
|
89
|
+
<xs:sequence>
|
90
|
+
<xs:element name="version" type="version_type" minOccurs="1" maxOccurs="1">
|
91
|
+
<xs:annotation>
|
92
|
+
<xs:documentation xml:lang="en">
|
93
|
+
Dataset version.
|
94
|
+
</xs:documentation>
|
95
|
+
</xs:annotation>
|
96
|
+
</xs:element>
|
97
|
+
<xs:element name="license" type="license_type" minOccurs="1" maxOccurs="1">
|
98
|
+
<xs:annotation>
|
99
|
+
<xs:documentation xml:lang="en">
|
100
|
+
Dataset license.
|
101
|
+
</xs:documentation>
|
102
|
+
</xs:annotation>
|
103
|
+
</xs:element>
|
104
|
+
<xs:element name="embargo" type="embargo_type" minOccurs="1" maxOccurs="1">
|
105
|
+
<xs:annotation>
|
106
|
+
<xs:documentation xml:lang="en">
|
107
|
+
Dataset embargo.
|
108
|
+
</xs:documentation>
|
109
|
+
</xs:annotation>
|
110
|
+
</xs:element>
|
111
|
+
<xs:element name="inventory" type="inventory_type" minOccurs="0" maxOccurs="1">
|
112
|
+
<xs:annotation>
|
113
|
+
<xs:documentation xml:lang="en">
|
114
|
+
File inventory of the dataset submission package.
|
115
|
+
</xs:documentation>
|
116
|
+
</xs:annotation>
|
117
|
+
</xs:element>
|
118
|
+
</xs:sequence>
|
119
|
+
</xs:complexType>
|
120
|
+
|
121
|
+
<xs:complexType name="version_type">
|
122
|
+
<xs:annotation>
|
123
|
+
<xs:documentation xml:lang="en">
|
124
|
+
Dataset version type.
|
125
|
+
</xs:documentation>
|
126
|
+
</xs:annotation>
|
127
|
+
<xs:sequence>
|
128
|
+
<xs:element name="version_number" type="xs:positiveInteger" minOccurs="1"
|
129
|
+
maxOccurs="1">
|
130
|
+
<xs:annotation>
|
131
|
+
<xs:documentation xml:lang="en">
|
132
|
+
Dataset version number.
|
133
|
+
</xs:documentation>
|
134
|
+
</xs:annotation>
|
135
|
+
</xs:element>
|
136
|
+
<xs:element name="date" type="xs:date" minOccurs="1" maxOccurs="1">
|
137
|
+
<xs:annotation>
|
138
|
+
<xs:documentation xml:lang="en">
|
139
|
+
Dataset version date, YYYY-MM-DD.
|
140
|
+
</xs:documentation>
|
141
|
+
</xs:annotation>
|
142
|
+
</xs:element>
|
143
|
+
<xs:element name="note" type="xs:string" minOccurs="0" maxOccurs="1">
|
144
|
+
<xs:annotation>
|
145
|
+
<xs:documentation xml:lang="en">
|
146
|
+
Optional dataset version note describing the conditions leading
|
147
|
+
to the creation of this version.
|
148
|
+
</xs:documentation>
|
149
|
+
</xs:annotation>
|
150
|
+
</xs:element>
|
151
|
+
</xs:sequence>
|
152
|
+
</xs:complexType>
|
153
|
+
|
154
|
+
<xs:complexType name="license_type">
|
155
|
+
<xs:annotation>
|
156
|
+
<xs:documentation xml:lang="en">
|
157
|
+
Dataset license type.
|
158
|
+
</xs:documentation>
|
159
|
+
</xs:annotation>
|
160
|
+
<xs:sequence>
|
161
|
+
<xs:element name="name" type="xs:string" minOccurs="1" maxOccurs="1">
|
162
|
+
<xs:annotation>
|
163
|
+
<xs:documentation xml:lang="en">
|
164
|
+
Dataset license name.
|
165
|
+
</xs:documentation>
|
166
|
+
</xs:annotation>
|
167
|
+
</xs:element>
|
168
|
+
<xs:element name="uri" type="xs:anyURI" minOccurs="1" maxOccurs="1">
|
169
|
+
<xs:annotation>
|
170
|
+
<xs:documentation xml:lang="en">
|
171
|
+
Dataset license URI.
|
172
|
+
</xs:documentation>
|
173
|
+
</xs:annotation>
|
174
|
+
</xs:element>
|
175
|
+
</xs:sequence>
|
176
|
+
</xs:complexType>
|
177
|
+
|
178
|
+
<xs:complexType name="embargo_type">
|
179
|
+
<xs:annotation>
|
180
|
+
<xs:documentation xml:lang="en">
|
181
|
+
Dataset embargo type.
|
182
|
+
</xs:documentation>
|
183
|
+
</xs:annotation>
|
184
|
+
<xs:sequence>
|
185
|
+
<xs:element name="type" type="embargo_type_type" minOccurs="1" maxOccurs="1">
|
186
|
+
<xs:annotation>
|
187
|
+
<xs:documentation xml:lang="en">
|
188
|
+
Dataset embargo type.
|
189
|
+
</xs:documentation>
|
190
|
+
</xs:annotation>
|
191
|
+
</xs:element>
|
192
|
+
<xs:element name="period" type="xs:string" minOccurs="1" maxOccurs="1">
|
193
|
+
<xs:annotation>
|
194
|
+
<xs:documentation xml:lang="en">
|
195
|
+
Dataset embargo period, i.e., a textual description of the
|
196
|
+
period, e.g., "6 months". If the embargo type is "none", this
|
197
|
+
value is ignored, but should be set to "none".
|
198
|
+
</xs:documentation>
|
199
|
+
</xs:annotation>
|
200
|
+
</xs:element>
|
201
|
+
<xs:element name="start" type="xs:date" minOccurs="1" maxOccurs="1">
|
202
|
+
<xs:annotation>
|
203
|
+
<xs:documentation xml:lang="en">
|
204
|
+
Dataset embargo start date. This should be set to the date
|
205
|
+
at which the embargo (and Stash wrapper instance document) is
|
206
|
+
created.
|
207
|
+
</xs:documentation>
|
208
|
+
</xs:annotation>
|
209
|
+
</xs:element>
|
210
|
+
<xs:element name="end" type="xs:date" minOccurs="1" maxOccurs="1">
|
211
|
+
<xs:annotation>
|
212
|
+
<xs:documentation xml:lang="en">
|
213
|
+
Dataset embargo end date. If the embargo type is "none", this
|
214
|
+
value is ignored, but should be set to the start date.
|
215
|
+
</xs:documentation>
|
216
|
+
</xs:annotation>
|
217
|
+
</xs:element>
|
218
|
+
</xs:sequence>
|
219
|
+
</xs:complexType>
|
220
|
+
|
221
|
+
<xs:simpleType name="embargo_type_type">
|
222
|
+
<xs:annotation>
|
223
|
+
<xs:documentation xml:lang="en">
|
224
|
+
Dataset embargo type: none, download, description.
|
225
|
+
</xs:documentation>
|
226
|
+
</xs:annotation>
|
227
|
+
<xs:restriction base="xs:string">
|
228
|
+
<xs:enumeration value="none"/>
|
229
|
+
<xs:enumeration value="download"/>
|
230
|
+
<xs:enumeration value="description"/>
|
231
|
+
</xs:restriction>
|
232
|
+
</xs:simpleType>
|
233
|
+
|
234
|
+
<xs:complexType name="inventory_type">
|
235
|
+
<xs:annotation>
|
236
|
+
<xs:documentation xml:lang="en">
|
237
|
+
Dataset file inventory type.
|
238
|
+
</xs:documentation>
|
239
|
+
</xs:annotation>
|
240
|
+
<xs:sequence>
|
241
|
+
<xs:element name="file" type="file_type" minOccurs="0" maxOccurs="unbounded">
|
242
|
+
<xs:annotation>
|
243
|
+
<xs:documentation xml:lang="en">
|
244
|
+
Dataset submission package file.
|
245
|
+
</xs:documentation>
|
246
|
+
</xs:annotation>
|
247
|
+
</xs:element>
|
248
|
+
</xs:sequence>
|
249
|
+
<xs:attribute name="num_files" type="xs:nonNegativeInteger">
|
250
|
+
<xs:annotation>
|
251
|
+
<xs:documentation xml:lang="en">
|
252
|
+
Number of files in the submission package inventory.
|
253
|
+
</xs:documentation>
|
254
|
+
</xs:annotation>
|
255
|
+
</xs:attribute>
|
256
|
+
</xs:complexType>
|
257
|
+
|
258
|
+
<xs:complexType name="file_type">
|
259
|
+
<xs:annotation>
|
260
|
+
<xs:documentation xml:lang="en">
|
261
|
+
Dataset inventory file type.
|
262
|
+
</xs:documentation>
|
263
|
+
</xs:annotation>
|
264
|
+
<xs:sequence>
|
265
|
+
<xs:element name="pathname" type="xs:string" minOccurs="1" maxOccurs="1">
|
266
|
+
<xs:annotation>
|
267
|
+
<xs:documentation xml:lang="en">
|
268
|
+
Dataset file pathname.
|
269
|
+
</xs:documentation>
|
270
|
+
</xs:annotation>
|
271
|
+
</xs:element>
|
272
|
+
|
273
|
+
<xs:element name="size" type="size_type" minOccurs="1" maxOccurs="1">
|
274
|
+
<xs:annotation>
|
275
|
+
<xs:documentation xml:lang="en">
|
276
|
+
Dataset file size, as an integer.
|
277
|
+
</xs:documentation>
|
278
|
+
</xs:annotation>
|
279
|
+
</xs:element>
|
280
|
+
|
281
|
+
<xs:element name="mime_type" type="xs:string" minOccurs="1" maxOccurs="1">
|
282
|
+
<xs:annotation>
|
283
|
+
<xs:documentation xml:lang="en">
|
284
|
+
Dataset file MIME type.
|
285
|
+
</xs:documentation>
|
286
|
+
</xs:annotation>
|
287
|
+
</xs:element>
|
288
|
+
</xs:sequence>
|
289
|
+
</xs:complexType>
|
290
|
+
|
291
|
+
<xs:complexType name="size_type">
|
292
|
+
<xs:annotation>
|
293
|
+
<xs:documentation xml:lang="en">
|
294
|
+
Dataset file size type.
|
295
|
+
</xs:documentation>
|
296
|
+
</xs:annotation>
|
297
|
+
<xs:simpleContent>
|
298
|
+
<xs:extension base="xs:nonNegativeInteger">
|
299
|
+
<xs:attribute name="unit">
|
300
|
+
<xs:simpleType>
|
301
|
+
<xs:restriction base="xs:string">
|
302
|
+
<xs:enumeration value="B"/>
|
303
|
+
</xs:restriction>
|
304
|
+
</xs:simpleType>
|
305
|
+
</xs:attribute>
|
306
|
+
</xs:extension>
|
307
|
+
</xs:simpleContent>
|
308
|
+
</xs:complexType>
|
309
|
+
|
310
|
+
<xs:complexType name="stash_descriptive_type">
|
311
|
+
<xs:annotation>
|
312
|
+
<xs:documentation xml:lang="en">
|
313
|
+
Stash descriptive metadata wrapper type. This contains arbitrary well-formed
|
314
|
+
XML conforming to the configured descriptive schema.
|
315
|
+
</xs:documentation>
|
316
|
+
</xs:annotation>
|
317
|
+
<xs:sequence>
|
318
|
+
<xs:any namespace="##any" processContents="lax" minOccurs="0"
|
319
|
+
maxOccurs="unbounded"/>
|
320
|
+
</xs:sequence>
|
321
|
+
</xs:complexType>
|
322
|
+
</xs:schema>
|
@@ -0,0 +1,56 @@
|
|
1
|
+
<?xml version="1.0" encoding="UTF-8"?>
|
2
|
+
<st:stash_wrapper xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
|
3
|
+
xsi:schemaLocation="http://dash.cdlib.org/stash_wrapper/ http://dash.cdlib.org/stash_wrapper/stash_wrapper.xsd"
|
4
|
+
xmlns:st="http://dash.cdlib.org/stash_wrapper/">
|
5
|
+
<st:identifier type="DOI">10.12345/1234567890</st:identifier>
|
6
|
+
<st:stash_administrative>
|
7
|
+
<st:version>
|
8
|
+
<st:version_number>1</st:version_number>
|
9
|
+
<st:date>2015-09-08</st:date>
|
10
|
+
</st:version>
|
11
|
+
<st:license>
|
12
|
+
<st:name>Creative Commons Attribution 4.0 International (CC-BY)</st:name>
|
13
|
+
<st:uri>https://creativecommons.org/licenses/by/4.0/legalcode</st:uri>
|
14
|
+
</st:license>
|
15
|
+
<st:embargo>
|
16
|
+
<st:type>download</st:type>
|
17
|
+
<st:period>6 months</st:period>
|
18
|
+
<st:start>2015-09-08</st:start>
|
19
|
+
<st:end>2016-03-07</st:end>
|
20
|
+
</st:embargo>
|
21
|
+
<st:inventory num_files="1">
|
22
|
+
<st:file>
|
23
|
+
<st:pathname>mydata.xlsx</st:pathname>
|
24
|
+
<st:size unit="B">12345678</st:size>
|
25
|
+
<st:mime_type>application/vnd.openxmlformats-officedocument.spreadsheetml.sheet</st:mime_type>
|
26
|
+
</st:file>
|
27
|
+
</st:inventory>
|
28
|
+
</st:stash_administrative>
|
29
|
+
<st:stash_descriptive>
|
30
|
+
<dcs:resource xmlns:dcs="http://datacite.org/schema/kernel-3"
|
31
|
+
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
|
32
|
+
xsi:schemaLocation="http://datacite.org/schema/kernel-3
|
33
|
+
http://schema.datacite.org/meta/kernel-3/metadata.xsd">
|
34
|
+
<dcs:identifier identifierType="DOI">10.12345/1234567890</dcs:identifier>
|
35
|
+
<dcs:creators>
|
36
|
+
<dcs:creator>
|
37
|
+
<dcs:creatorName>Abrams, Stephen</dcs:creatorName>
|
38
|
+
</dcs:creator>
|
39
|
+
</dcs:creators>
|
40
|
+
<dcs:titles>
|
41
|
+
<dcs:title>My dataset</dcs:title>
|
42
|
+
</dcs:titles>
|
43
|
+
<dcs:publisher>UC Office of the President</dcs:publisher>
|
44
|
+
<dcs:publicationYear>2016</dcs:publicationYear>
|
45
|
+
<dcs:subjects>
|
46
|
+
<dcs:subject>Data literacy</dcs:subject>
|
47
|
+
</dcs:subjects>
|
48
|
+
<dcs:resourceType resourceTypeGeneral="Dataset">Spreadsheet</dcs:resourceType>
|
49
|
+
<dcs:descriptions>
|
50
|
+
<dcs:description descriptionType="Abstract">
|
51
|
+
Lorum ipsum.
|
52
|
+
</dcs:description>
|
53
|
+
</dcs:descriptions>
|
54
|
+
</dcs:resource>
|
55
|
+
</st:stash_descriptive>
|
56
|
+
</st:stash_wrapper>
|
@@ -0,0 +1,88 @@
|
|
1
|
+
<?xml version="1.0" encoding="UTF-8"?>
|
2
|
+
<resource xmlns='http://datacite.org/schema/kernel-3' xmlns:xsi='http://www.w3.org/2001/XMLSchema-instance'
|
3
|
+
xsi:schemaLocation='http://datacite.org/schema/kernel-3 http://schema.datacite.org/meta/kernel-3/metadata.xsd'>
|
4
|
+
<identifier identifierType='DOI'>10.14749/1407399498</identifier>
|
5
|
+
<creators>
|
6
|
+
<creator>
|
7
|
+
<creatorName>Zuma, Khangelani</creatorName>
|
8
|
+
</creator>
|
9
|
+
<creator>
|
10
|
+
<creatorName>Human Sciences Research Council</creatorName>
|
11
|
+
</creator>
|
12
|
+
</creators>
|
13
|
+
<titles>
|
14
|
+
<title xml:lang='en'>HSRC Master Sample II</title>
|
15
|
+
</titles>
|
16
|
+
<publisher>HSRC - Human Science Research Council SA</publisher>
|
17
|
+
<publicationYear>2014</publicationYear>
|
18
|
+
<contributors>
|
19
|
+
<contributor contributorType='Distributor'>
|
20
|
+
<contributorName>Human Sciences Research Council</contributorName>
|
21
|
+
</contributor>
|
22
|
+
<contributor contributorType='Funder'>
|
23
|
+
<contributorName>Human Sciences Research Council</contributorName>
|
24
|
+
</contributor>
|
25
|
+
<contributor contributorType='RightsHolder'>
|
26
|
+
<contributorName>Human Sciences Research Council</contributorName>
|
27
|
+
</contributor>
|
28
|
+
</contributors>
|
29
|
+
<language>eng</language>
|
30
|
+
<resourceType resourceTypeGeneral='Dataset'/>
|
31
|
+
<version>1.0</version>
|
32
|
+
<rightsList>
|
33
|
+
<rights>
|
34
|
+
By accessing the data, you give assurance that The data and documentation will not be duplicated, redistributed or sold without prior approval from
|
35
|
+
the rights holder. The data will be used for scientific research or educational purposes only. The data will only be used for the specified
|
36
|
+
purpose. If it is used for another purpose the additional purpose will be registered. Redundant data files will be destroyed. The confidentiality of
|
37
|
+
individuals/organisations in the data will be preserved at all times. No attempt will be made to obtain or derive information from the data to
|
38
|
+
identify individuals/organisations. The HSRC will be acknowledged in all published and unpublished works based on the data according to the provided
|
39
|
+
citation. The HSRC will be informed of any books, articles, conference papers, theses, dissertations, reports or other publications resulting from
|
40
|
+
work based in whole or in part on the data and documentation. For archiving and bibliographic purposes an electronic copy of all reports and
|
41
|
+
publications based on the requested data will be sent to the HSRC. To offer for deposit into the HSRC Data Collection any new data sets which have
|
42
|
+
been derived from or which have been created by the combination of the data supplied with other data. The data team bears no responsibility for use of
|
43
|
+
the data or for interpretations or inferences based upon such uses. Failure to comply with the End User License may result in sanctions being imposed.
|
44
|
+
</rights>
|
45
|
+
</rightsList>
|
46
|
+
<descriptions>
|
47
|
+
<description descriptionType='Abstract' xml:lang='en'>
|
48
|
+
<p> The 2005 HSRC Master Sample was used for SABSSM 2008 and 2012, the SANHANES study in 2012 and SASAS 2007-2010 (adjacent EAs) to obtain an
|
49
|
+
understanding of geographical spread of HIV/AIDS, perceptions and attitudes of people and other health related studies over time.</p>
|
50
|
+
</description>
|
51
|
+
<description descriptionType='Abstract' xml:lang='en'>
|
52
|
+
<p> A sample can be defined as a subset containing the characteristics of a larger population. Samples are used in statistical testing when
|
53
|
+
population sizes are too large for the test to include all possible members or observations. A sample should represent the whole population and not
|
54
|
+
reflect bias toward a specific attribute.[1]</p> <p> One of the most crucial aspects of sample design in household surveys is its
|
55
|
+
frame. The sampling frame has significant implications on the cost and the quality of any survey, household or otherwise.[2]</p> <p> The
|
56
|
+
sampling frame .... in a household survey must cover the entire target population. When that frame is used for multiple surveys or multiple rounds of
|
57
|
+
the same survey it is known as a master sample frame or .... master sample.[3]</p> <p> A master sample is a sample drawn from a population
|
58
|
+
for use on a number of future occasions, so as to avoid ad hoc sampling on each occasion. Sometimes the master sample is large and subsequent
|
59
|
+
inquiries are based on a sub-sample from it.[4]</p> <p> The HSRC compiles master samples in order to construct samples for various HSRC
|
60
|
+
research studies. The 2005 HSRC Master Sample was used for SABSSM 2008 and 2012, SASAS 2007-2010 and the SANHANES study in 2012 to obtain an
|
61
|
+
understanding of geographical spread of HIV/AIDS, perceptions and attitudes of people and other health related studies over time.</p> <p>
|
62
|
+
The 2005 HSRC Master Sample was created in the following way:</p> <p> South Africa was delineated into EAs according to municipality and
|
63
|
+
province. Municipal boundaries were obtained from the Municipal Demarcation Board. An Enumeration area (EA) is the smallest geographical unit (piece
|
64
|
+
of land) into which the country is divided for census or survey enumeration.[5] The concepts and definitions of terms used for Census 2001 comply in
|
65
|
+
most instances with United Nations standards for censuses.</p> <p> A total of 1,000 census enumeration areas (EAs) from the 2001
|
66
|
+
population census were randomly selected using probability proportional to size and stratified by province, locality type and race in urban areas from
|
67
|
+
a database of 80 787 EAs that were mapped using aerial photography to develop an HSRC master sample for selecting households.</p> <p> The
|
68
|
+
ideal frame would be complete with respect to the target population if all of its members (the universe) are covered by the frame.</p> <p>
|
69
|
+
Ideal characteristics of a master sample:</p> <ul> <li> The master frame should be as complete, accurate and current as
|
70
|
+
practicable.</li> <li> A master sample frame for household surveys is typically developed from the most recent census, just as a regular
|
71
|
+
sample frame is.</li> <li> Because the master frame may be used during an entire intercensal (between census) period, however, it will
|
72
|
+
usually require periodic and regular updating such as every 2-3 years.</li> <li> This is in contrast to a regular frame which is more
|
73
|
+
likely to be up-dated on an ad hoc basis and only when a particular survey is being planned[6]</li> </ul> <p> [1]
|
74
|
+
http://www.investopedia.com/terms/s/sample.asp</p> <p> [2]
|
75
|
+
http://unstats.un.org/unsd/demographic/meetings/egm/sampling_1203/docs/no_3.pdf</p> <p> [3]
|
76
|
+
http://unstats.un.org/unsd/demographic/meetings/egm/sampling_1203/docs/no_3.pdf</p> <p> [4] A Dictionary of Statistical Terms, 5th
|
77
|
+
edition, prepared for the International Statistical Institute by F.H.C. Marriott. Published for the International Statistical Institute by Longman
|
78
|
+
Scientific and Technical. http://stats.oecd.org/glossary/detail.asp?ID=3708</p> <p> [5]
|
79
|
+
http://africageodownloads.info/128_mokgokolo.pdf</p> <p> [6]
|
80
|
+
http://unstats.un.org/unsd/demographic/meetings/egm/sampling_1203/docs/no_3.pdf</p>
|
81
|
+
</description>
|
82
|
+
</descriptions>
|
83
|
+
<geoLocations>
|
84
|
+
<geoLocation>
|
85
|
+
<geoLocationPlace>National - all 9 provinces</geoLocationPlace>
|
86
|
+
</geoLocation>
|
87
|
+
</geoLocations>
|
88
|
+
</resource>
|