carrot-transform 0.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of carrot-transform might be problematic. Click here for more details.
- carrot_transform-0.3.dist-info/LICENSE +21 -0
- carrot_transform-0.3.dist-info/METADATA +28 -0
- carrot_transform-0.3.dist-info/RECORD +19 -0
- carrot_transform-0.3.dist-info/WHEEL +5 -0
- carrot_transform-0.3.dist-info/entry_points.txt +2 -0
- carrot_transform-0.3.dist-info/top_level.txt +1 -0
- carrottransform/__init__.py +5 -0
- carrottransform/_version.py +2 -0
- carrottransform/cli/__init__.py +0 -0
- carrottransform/cli/command.py +21 -0
- carrottransform/cli/subcommands/__init__.py +0 -0
- carrottransform/cli/subcommands/run.py +484 -0
- carrottransform/config/OMOPCDM_postgresql_5.3_ddl.sql +508 -0
- carrottransform/config/omop.json +61 -0
- carrottransform/tools/__init__.py +17 -0
- carrottransform/tools/file_helpers.py +14 -0
- carrottransform/tools/mappingrules.py +157 -0
- carrottransform/tools/metrics.py +127 -0
- carrottransform/tools/omopcdm.py +182 -0
|
@@ -0,0 +1,508 @@
|
|
|
1
|
+
--postgresql CDM DDL Specification for OMOP Common Data Model 5.3
|
|
2
|
+
|
|
3
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
4
|
+
CREATE TABLE @cdmDatabaseSchema.PERSON (
|
|
5
|
+
person_id integer NOT NULL,
|
|
6
|
+
gender_concept_id integer NOT NULL,
|
|
7
|
+
year_of_birth integer NOT NULL,
|
|
8
|
+
month_of_birth integer NULL,
|
|
9
|
+
day_of_birth integer NULL,
|
|
10
|
+
birth_datetime TIMESTAMP NULL,
|
|
11
|
+
race_concept_id integer NOT NULL,
|
|
12
|
+
ethnicity_concept_id integer NOT NULL,
|
|
13
|
+
location_id integer NULL,
|
|
14
|
+
provider_id integer NULL,
|
|
15
|
+
care_site_id integer NULL,
|
|
16
|
+
person_source_value varchar(50) NULL,
|
|
17
|
+
gender_source_value varchar(50) NULL,
|
|
18
|
+
gender_source_concept_id integer NULL,
|
|
19
|
+
race_source_value varchar(50) NULL,
|
|
20
|
+
race_source_concept_id integer NULL,
|
|
21
|
+
ethnicity_source_value varchar(50) NULL,
|
|
22
|
+
ethnicity_source_concept_id integer NULL );
|
|
23
|
+
|
|
24
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
25
|
+
CREATE TABLE @cdmDatabaseSchema.OBSERVATION_PERIOD (
|
|
26
|
+
observation_period_id integer NOT NULL,
|
|
27
|
+
person_id integer NOT NULL,
|
|
28
|
+
observation_period_start_date date NOT NULL,
|
|
29
|
+
observation_period_end_date date NOT NULL,
|
|
30
|
+
period_type_concept_id integer NOT NULL );
|
|
31
|
+
|
|
32
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
33
|
+
CREATE TABLE @cdmDatabaseSchema.VISIT_OCCURRENCE (
|
|
34
|
+
visit_occurrence_id integer NOT NULL,
|
|
35
|
+
person_id integer NOT NULL,
|
|
36
|
+
visit_concept_id integer NOT NULL,
|
|
37
|
+
visit_start_date date NOT NULL,
|
|
38
|
+
visit_start_datetime TIMESTAMP NULL,
|
|
39
|
+
visit_end_date date NOT NULL,
|
|
40
|
+
visit_end_datetime TIMESTAMP NULL,
|
|
41
|
+
visit_type_concept_id Integer NOT NULL,
|
|
42
|
+
provider_id integer NULL,
|
|
43
|
+
care_site_id integer NULL,
|
|
44
|
+
visit_source_value varchar(50) NULL,
|
|
45
|
+
visit_source_concept_id integer NULL,
|
|
46
|
+
admitting_source_concept_id integer NULL,
|
|
47
|
+
admitting_source_value varchar(50) NULL,
|
|
48
|
+
discharge_to_concept_id integer NULL,
|
|
49
|
+
discharge_to_source_value varchar(50) NULL,
|
|
50
|
+
preceding_visit_occurrence_id integer NULL );
|
|
51
|
+
|
|
52
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
53
|
+
CREATE TABLE @cdmDatabaseSchema.VISIT_DETAIL (
|
|
54
|
+
visit_detail_id integer NOT NULL,
|
|
55
|
+
person_id integer NOT NULL,
|
|
56
|
+
visit_detail_concept_id integer NOT NULL,
|
|
57
|
+
visit_detail_start_date date NOT NULL,
|
|
58
|
+
visit_detail_start_datetime TIMESTAMP NULL,
|
|
59
|
+
visit_detail_end_date date NOT NULL,
|
|
60
|
+
visit_detail_end_datetime TIMESTAMP NULL,
|
|
61
|
+
visit_detail_type_concept_id integer NOT NULL,
|
|
62
|
+
provider_id integer NULL,
|
|
63
|
+
care_site_id integer NULL,
|
|
64
|
+
visit_detail_source_value varchar(50) NULL,
|
|
65
|
+
visit_detail_source_concept_id Integer NULL,
|
|
66
|
+
admitting_source_value Varchar(50) NULL,
|
|
67
|
+
admitting_source_concept_id Integer NULL,
|
|
68
|
+
discharge_to_source_value Varchar(50) NULL,
|
|
69
|
+
discharge_to_concept_id integer NULL,
|
|
70
|
+
preceding_visit_detail_id integer NULL,
|
|
71
|
+
visit_detail_parent_id integer NULL,
|
|
72
|
+
visit_occurrence_id integer NOT NULL );
|
|
73
|
+
|
|
74
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
75
|
+
CREATE TABLE @cdmDatabaseSchema.CONDITION_OCCURRENCE (
|
|
76
|
+
condition_occurrence_id integer NOT NULL,
|
|
77
|
+
person_id integer NOT NULL,
|
|
78
|
+
condition_concept_id integer NOT NULL,
|
|
79
|
+
condition_start_date date NOT NULL,
|
|
80
|
+
condition_start_datetime TIMESTAMP NULL,
|
|
81
|
+
condition_end_date date NULL,
|
|
82
|
+
condition_end_datetime TIMESTAMP NULL,
|
|
83
|
+
condition_type_concept_id integer NOT NULL,
|
|
84
|
+
condition_status_concept_id integer NULL,
|
|
85
|
+
stop_reason varchar(20) NULL,
|
|
86
|
+
provider_id integer NULL,
|
|
87
|
+
visit_occurrence_id integer NULL,
|
|
88
|
+
visit_detail_id integer NULL,
|
|
89
|
+
condition_source_value varchar(50) NULL,
|
|
90
|
+
condition_source_concept_id integer NULL,
|
|
91
|
+
condition_status_source_value varchar(50) NULL );
|
|
92
|
+
|
|
93
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
94
|
+
CREATE TABLE @cdmDatabaseSchema.DRUG_EXPOSURE (
|
|
95
|
+
drug_exposure_id integer NOT NULL,
|
|
96
|
+
person_id integer NOT NULL,
|
|
97
|
+
drug_concept_id integer NOT NULL,
|
|
98
|
+
drug_exposure_start_date date NOT NULL,
|
|
99
|
+
drug_exposure_start_datetime TIMESTAMP NULL,
|
|
100
|
+
drug_exposure_end_date date NOT NULL,
|
|
101
|
+
drug_exposure_end_datetime TIMESTAMP NULL,
|
|
102
|
+
verbatim_end_date date NULL,
|
|
103
|
+
drug_type_concept_id integer NOT NULL,
|
|
104
|
+
stop_reason varchar(20) NULL,
|
|
105
|
+
refills integer NULL,
|
|
106
|
+
quantity NUMERIC NULL,
|
|
107
|
+
days_supply integer NULL,
|
|
108
|
+
sig TEXT NULL,
|
|
109
|
+
route_concept_id integer NULL,
|
|
110
|
+
lot_number varchar(50) NULL,
|
|
111
|
+
provider_id integer NULL,
|
|
112
|
+
visit_occurrence_id integer NULL,
|
|
113
|
+
visit_detail_id integer NULL,
|
|
114
|
+
drug_source_value varchar(50) NULL,
|
|
115
|
+
drug_source_concept_id integer NULL,
|
|
116
|
+
route_source_value varchar(50) NULL,
|
|
117
|
+
dose_unit_source_value varchar(50) NULL );
|
|
118
|
+
|
|
119
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
120
|
+
CREATE TABLE @cdmDatabaseSchema.PROCEDURE_OCCURRENCE (
|
|
121
|
+
procedure_occurrence_id integer NOT NULL,
|
|
122
|
+
person_id integer NOT NULL,
|
|
123
|
+
procedure_concept_id integer NOT NULL,
|
|
124
|
+
procedure_date date NOT NULL,
|
|
125
|
+
procedure_datetime TIMESTAMP NULL,
|
|
126
|
+
procedure_type_concept_id integer NOT NULL,
|
|
127
|
+
modifier_concept_id integer NULL,
|
|
128
|
+
quantity integer NULL,
|
|
129
|
+
provider_id integer NULL,
|
|
130
|
+
visit_occurrence_id integer NULL,
|
|
131
|
+
visit_detail_id integer NULL,
|
|
132
|
+
procedure_source_value varchar(50) NULL,
|
|
133
|
+
procedure_source_concept_id integer NULL,
|
|
134
|
+
modifier_source_value varchar(50) NULL );
|
|
135
|
+
|
|
136
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
137
|
+
CREATE TABLE @cdmDatabaseSchema.DEVICE_EXPOSURE (
|
|
138
|
+
device_exposure_id integer NOT NULL,
|
|
139
|
+
person_id integer NOT NULL,
|
|
140
|
+
device_concept_id integer NOT NULL,
|
|
141
|
+
device_exposure_start_date date NOT NULL,
|
|
142
|
+
device_exposure_start_datetime TIMESTAMP NULL,
|
|
143
|
+
device_exposure_end_date date NULL,
|
|
144
|
+
device_exposure_end_datetime TIMESTAMP NULL,
|
|
145
|
+
device_type_concept_id integer NOT NULL,
|
|
146
|
+
unique_device_id varchar(50) NULL,
|
|
147
|
+
quantity integer NULL,
|
|
148
|
+
provider_id integer NULL,
|
|
149
|
+
visit_occurrence_id integer NULL,
|
|
150
|
+
visit_detail_id integer NULL,
|
|
151
|
+
device_source_value varchar(50) NULL,
|
|
152
|
+
device_source_concept_id integer NULL );
|
|
153
|
+
|
|
154
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
155
|
+
CREATE TABLE @cdmDatabaseSchema.MEASUREMENT (
|
|
156
|
+
measurement_id integer NOT NULL,
|
|
157
|
+
person_id integer NOT NULL,
|
|
158
|
+
measurement_concept_id integer NOT NULL,
|
|
159
|
+
measurement_date date NOT NULL,
|
|
160
|
+
measurement_datetime TIMESTAMP NULL,
|
|
161
|
+
measurement_time varchar(10) NULL,
|
|
162
|
+
measurement_type_concept_id integer NOT NULL,
|
|
163
|
+
operator_concept_id integer NULL,
|
|
164
|
+
value_as_number NUMERIC NULL,
|
|
165
|
+
value_as_concept_id integer NULL,
|
|
166
|
+
unit_concept_id integer NULL,
|
|
167
|
+
range_low NUMERIC NULL,
|
|
168
|
+
range_high NUMERIC NULL,
|
|
169
|
+
provider_id integer NULL,
|
|
170
|
+
visit_occurrence_id integer NULL,
|
|
171
|
+
visit_detail_id integer NULL,
|
|
172
|
+
measurement_source_value varchar(50) NULL,
|
|
173
|
+
measurement_source_concept_id integer NULL,
|
|
174
|
+
unit_source_value varchar(50) NULL,
|
|
175
|
+
value_source_value varchar(50) NULL );
|
|
176
|
+
|
|
177
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
178
|
+
CREATE TABLE @cdmDatabaseSchema.OBSERVATION (
|
|
179
|
+
observation_id integer NOT NULL,
|
|
180
|
+
person_id integer NOT NULL,
|
|
181
|
+
observation_concept_id integer NOT NULL,
|
|
182
|
+
observation_date date NOT NULL,
|
|
183
|
+
observation_datetime TIMESTAMP NULL,
|
|
184
|
+
observation_type_concept_id integer NOT NULL,
|
|
185
|
+
value_as_number NUMERIC NULL,
|
|
186
|
+
value_as_string varchar(60) NULL,
|
|
187
|
+
value_as_concept_id Integer NULL,
|
|
188
|
+
qualifier_concept_id integer NULL,
|
|
189
|
+
unit_concept_id integer NULL,
|
|
190
|
+
provider_id integer NULL,
|
|
191
|
+
visit_occurrence_id integer NULL,
|
|
192
|
+
visit_detail_id integer NULL,
|
|
193
|
+
observation_source_value varchar(50) NULL,
|
|
194
|
+
observation_source_concept_id integer NULL,
|
|
195
|
+
unit_source_value varchar(50) NULL,
|
|
196
|
+
qualifier_source_value varchar(50) NULL );
|
|
197
|
+
|
|
198
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
199
|
+
CREATE TABLE @cdmDatabaseSchema.DEATH (
|
|
200
|
+
person_id integer NOT NULL,
|
|
201
|
+
death_date date NOT NULL,
|
|
202
|
+
death_datetime TIMESTAMP NULL,
|
|
203
|
+
death_type_concept_id integer NULL,
|
|
204
|
+
cause_concept_id integer NULL,
|
|
205
|
+
cause_source_value varchar(50) NULL,
|
|
206
|
+
cause_source_concept_id integer NULL );
|
|
207
|
+
|
|
208
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
209
|
+
CREATE TABLE @cdmDatabaseSchema.NOTE (
|
|
210
|
+
note_id integer NOT NULL,
|
|
211
|
+
person_id integer NOT NULL,
|
|
212
|
+
note_date date NOT NULL,
|
|
213
|
+
note_datetime TIMESTAMP NULL,
|
|
214
|
+
note_type_concept_id integer NOT NULL,
|
|
215
|
+
note_class_concept_id integer NOT NULL,
|
|
216
|
+
note_title varchar(250) NULL,
|
|
217
|
+
note_text TEXT NOT NULL,
|
|
218
|
+
encoding_concept_id integer NOT NULL,
|
|
219
|
+
language_concept_id integer NOT NULL,
|
|
220
|
+
provider_id integer NULL,
|
|
221
|
+
visit_occurrence_id integer NULL,
|
|
222
|
+
visit_detail_id integer NULL,
|
|
223
|
+
note_source_value varchar(50) NULL );
|
|
224
|
+
|
|
225
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
226
|
+
CREATE TABLE @cdmDatabaseSchema.NOTE_NLP (
|
|
227
|
+
note_nlp_id integer NOT NULL,
|
|
228
|
+
note_id integer NOT NULL,
|
|
229
|
+
section_concept_id integer NULL,
|
|
230
|
+
snippet varchar(250) NULL,
|
|
231
|
+
"offset" varchar(50) NULL,
|
|
232
|
+
lexical_variant varchar(250) NOT NULL,
|
|
233
|
+
note_nlp_concept_id integer NULL,
|
|
234
|
+
note_nlp_source_concept_id integer NULL,
|
|
235
|
+
nlp_system varchar(250) NULL,
|
|
236
|
+
nlp_date date NOT NULL,
|
|
237
|
+
nlp_datetime TIMESTAMP NULL,
|
|
238
|
+
term_exists varchar(1) NULL,
|
|
239
|
+
term_temporal varchar(50) NULL,
|
|
240
|
+
term_modifiers varchar(2000) NULL );
|
|
241
|
+
|
|
242
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
243
|
+
CREATE TABLE @cdmDatabaseSchema.SPECIMEN (
|
|
244
|
+
specimen_id integer NOT NULL,
|
|
245
|
+
person_id integer NOT NULL,
|
|
246
|
+
specimen_concept_id integer NOT NULL,
|
|
247
|
+
specimen_type_concept_id integer NOT NULL,
|
|
248
|
+
specimen_date date NOT NULL,
|
|
249
|
+
specimen_datetime TIMESTAMP NULL,
|
|
250
|
+
quantity NUMERIC NULL,
|
|
251
|
+
unit_concept_id integer NULL,
|
|
252
|
+
anatomic_site_concept_id integer NULL,
|
|
253
|
+
disease_status_concept_id integer NULL,
|
|
254
|
+
specimen_source_id varchar(50) NULL,
|
|
255
|
+
specimen_source_value varchar(50) NULL,
|
|
256
|
+
unit_source_value varchar(50) NULL,
|
|
257
|
+
anatomic_site_source_value varchar(50) NULL,
|
|
258
|
+
disease_status_source_value varchar(50) NULL );
|
|
259
|
+
|
|
260
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
261
|
+
CREATE TABLE @cdmDatabaseSchema.FACT_RELATIONSHIP (
|
|
262
|
+
domain_concept_id_1 integer NOT NULL,
|
|
263
|
+
fact_id_1 integer NOT NULL,
|
|
264
|
+
domain_concept_id_2 integer NOT NULL,
|
|
265
|
+
fact_id_2 integer NOT NULL,
|
|
266
|
+
relationship_concept_id integer NOT NULL );
|
|
267
|
+
|
|
268
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
269
|
+
CREATE TABLE @cdmDatabaseSchema.LOCATION (
|
|
270
|
+
location_id integer NOT NULL,
|
|
271
|
+
address_1 varchar(50) NULL,
|
|
272
|
+
address_2 varchar(50) NULL,
|
|
273
|
+
city varchar(50) NULL,
|
|
274
|
+
state varchar(2) NULL,
|
|
275
|
+
zip varchar(9) NULL,
|
|
276
|
+
county varchar(20) NULL,
|
|
277
|
+
location_source_value varchar(50) NULL );
|
|
278
|
+
|
|
279
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
280
|
+
CREATE TABLE @cdmDatabaseSchema.CARE_SITE (
|
|
281
|
+
care_site_id integer NOT NULL,
|
|
282
|
+
care_site_name varchar(255) NULL,
|
|
283
|
+
place_of_service_concept_id integer NULL,
|
|
284
|
+
location_id integer NULL,
|
|
285
|
+
care_site_source_value varchar(50) NULL,
|
|
286
|
+
place_of_service_source_value varchar(50) NULL );
|
|
287
|
+
|
|
288
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
289
|
+
CREATE TABLE @cdmDatabaseSchema.PROVIDER (
|
|
290
|
+
provider_id integer NOT NULL,
|
|
291
|
+
provider_name varchar(255) NULL,
|
|
292
|
+
npi varchar(20) NULL,
|
|
293
|
+
dea varchar(20) NULL,
|
|
294
|
+
specialty_concept_id integer NULL,
|
|
295
|
+
care_site_id integer NULL,
|
|
296
|
+
year_of_birth integer NULL,
|
|
297
|
+
gender_concept_id integer NULL,
|
|
298
|
+
provider_source_value varchar(50) NULL,
|
|
299
|
+
specialty_source_value varchar(50) NULL,
|
|
300
|
+
specialty_source_concept_id integer NULL,
|
|
301
|
+
gender_source_value varchar(50) NULL,
|
|
302
|
+
gender_source_concept_id integer NULL );
|
|
303
|
+
|
|
304
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
305
|
+
CREATE TABLE @cdmDatabaseSchema.PAYER_PLAN_PERIOD (
|
|
306
|
+
payer_plan_period_id integer NOT NULL,
|
|
307
|
+
person_id integer NOT NULL,
|
|
308
|
+
payer_plan_period_start_date date NOT NULL,
|
|
309
|
+
payer_plan_period_end_date date NOT NULL,
|
|
310
|
+
payer_concept_id integer NULL,
|
|
311
|
+
payer_source_value varchar(50) NULL,
|
|
312
|
+
payer_source_concept_id integer NULL,
|
|
313
|
+
plan_concept_id integer NULL,
|
|
314
|
+
plan_source_value varchar(50) NULL,
|
|
315
|
+
plan_source_concept_id integer NULL,
|
|
316
|
+
sponsor_concept_id integer NULL,
|
|
317
|
+
sponsor_source_value varchar(50) NULL,
|
|
318
|
+
sponsor_source_concept_id integer NULL,
|
|
319
|
+
family_source_value varchar(50) NULL,
|
|
320
|
+
stop_reason_concept_id integer NULL,
|
|
321
|
+
stop_reason_source_value varchar(50) NULL,
|
|
322
|
+
stop_reason_source_concept_id integer NULL );
|
|
323
|
+
|
|
324
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
325
|
+
CREATE TABLE @cdmDatabaseSchema.COST (
|
|
326
|
+
cost_id integer NOT NULL,
|
|
327
|
+
cost_event_id integer NOT NULL,
|
|
328
|
+
cost_domain_id varchar(20) NOT NULL,
|
|
329
|
+
cost_type_concept_id integer NOT NULL,
|
|
330
|
+
currency_concept_id integer NULL,
|
|
331
|
+
total_charge NUMERIC NULL,
|
|
332
|
+
total_cost NUMERIC NULL,
|
|
333
|
+
total_paid NUMERIC NULL,
|
|
334
|
+
paid_by_payer NUMERIC NULL,
|
|
335
|
+
paid_by_patient NUMERIC NULL,
|
|
336
|
+
paid_patient_copay NUMERIC NULL,
|
|
337
|
+
paid_patient_coinsurance NUMERIC NULL,
|
|
338
|
+
paid_patient_deductible NUMERIC NULL,
|
|
339
|
+
paid_by_primary NUMERIC NULL,
|
|
340
|
+
paid_ingredient_cost NUMERIC NULL,
|
|
341
|
+
paid_dispensing_fee NUMERIC NULL,
|
|
342
|
+
payer_plan_period_id integer NULL,
|
|
343
|
+
amount_allowed NUMERIC NULL,
|
|
344
|
+
revenue_code_concept_id integer NULL,
|
|
345
|
+
revenue_code_source_value varchar(50) NULL,
|
|
346
|
+
drg_concept_id integer NULL,
|
|
347
|
+
drg_source_value varchar(3) NULL );
|
|
348
|
+
|
|
349
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
350
|
+
CREATE TABLE @cdmDatabaseSchema.DRUG_ERA (
|
|
351
|
+
drug_era_id integer NOT NULL,
|
|
352
|
+
person_id integer NOT NULL,
|
|
353
|
+
drug_concept_id integer NOT NULL,
|
|
354
|
+
drug_era_start_date date NOT NULL,
|
|
355
|
+
drug_era_end_date date NOT NULL,
|
|
356
|
+
drug_exposure_count integer NULL,
|
|
357
|
+
gap_days integer NULL );
|
|
358
|
+
|
|
359
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
360
|
+
CREATE TABLE @cdmDatabaseSchema.DOSE_ERA (
|
|
361
|
+
dose_era_id integer NOT NULL,
|
|
362
|
+
person_id integer NOT NULL,
|
|
363
|
+
drug_concept_id integer NOT NULL,
|
|
364
|
+
unit_concept_id integer NOT NULL,
|
|
365
|
+
dose_value NUMERIC NOT NULL,
|
|
366
|
+
dose_era_start_date date NOT NULL,
|
|
367
|
+
dose_era_end_date date NOT NULL );
|
|
368
|
+
|
|
369
|
+
--HINT DISTRIBUTE ON KEY (person_id)
|
|
370
|
+
CREATE TABLE @cdmDatabaseSchema.CONDITION_ERA (
|
|
371
|
+
condition_era_id integer NOT NULL,
|
|
372
|
+
person_id integer NOT NULL,
|
|
373
|
+
condition_concept_id integer NOT NULL,
|
|
374
|
+
condition_era_start_date date NOT NULL,
|
|
375
|
+
condition_era_end_date date NOT NULL,
|
|
376
|
+
condition_occurrence_count integer NULL );
|
|
377
|
+
|
|
378
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
379
|
+
CREATE TABLE @cdmDatabaseSchema.METADATA (
|
|
380
|
+
metadata_concept_id integer NOT NULL,
|
|
381
|
+
metadata_type_concept_id integer NOT NULL,
|
|
382
|
+
name varchar(250) NOT NULL,
|
|
383
|
+
value_as_string varchar(250) NULL,
|
|
384
|
+
value_as_concept_id integer NULL,
|
|
385
|
+
metadata_date date NULL,
|
|
386
|
+
metadata_datetime TIMESTAMP NULL );
|
|
387
|
+
|
|
388
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
389
|
+
CREATE TABLE @cdmDatabaseSchema.CDM_SOURCE (
|
|
390
|
+
cdm_source_name varchar(255) NOT NULL,
|
|
391
|
+
cdm_source_abbreviation varchar(25) NULL,
|
|
392
|
+
cdm_holder varchar(255) NULL,
|
|
393
|
+
source_description TEXT NULL,
|
|
394
|
+
source_documentation_reference varchar(255) NULL,
|
|
395
|
+
cdm_etl_reference varchar(255) NULL,
|
|
396
|
+
source_release_date date NULL,
|
|
397
|
+
cdm_release_date date NULL,
|
|
398
|
+
cdm_version varchar(10) NULL,
|
|
399
|
+
vocabulary_version varchar(20) NULL );
|
|
400
|
+
|
|
401
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
402
|
+
CREATE TABLE @cdmDatabaseSchema.CONCEPT (
|
|
403
|
+
concept_id integer NOT NULL,
|
|
404
|
+
concept_name varchar(255) NOT NULL,
|
|
405
|
+
domain_id varchar(20) NOT NULL,
|
|
406
|
+
vocabulary_id varchar(20) NOT NULL,
|
|
407
|
+
concept_class_id varchar(20) NOT NULL,
|
|
408
|
+
standard_concept varchar(1) NULL,
|
|
409
|
+
concept_code varchar(50) NOT NULL,
|
|
410
|
+
valid_start_date date NOT NULL,
|
|
411
|
+
valid_end_date date NOT NULL,
|
|
412
|
+
invalid_reason varchar(1) NULL );
|
|
413
|
+
|
|
414
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
415
|
+
CREATE TABLE @cdmDatabaseSchema.VOCABULARY (
|
|
416
|
+
vocabulary_id varchar(20) NOT NULL,
|
|
417
|
+
vocabulary_name varchar(255) NOT NULL,
|
|
418
|
+
vocabulary_reference varchar(255) NOT NULL,
|
|
419
|
+
vocabulary_version varchar(255) NULL,
|
|
420
|
+
vocabulary_concept_id integer NOT NULL );
|
|
421
|
+
|
|
422
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
423
|
+
CREATE TABLE @cdmDatabaseSchema.DOMAIN (
|
|
424
|
+
domain_id varchar(20) NOT NULL,
|
|
425
|
+
domain_name varchar(255) NOT NULL,
|
|
426
|
+
domain_concept_id integer NOT NULL );
|
|
427
|
+
|
|
428
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
429
|
+
CREATE TABLE @cdmDatabaseSchema.CONCEPT_CLASS (
|
|
430
|
+
concept_class_id varchar(20) NOT NULL,
|
|
431
|
+
concept_class_name varchar(255) NOT NULL,
|
|
432
|
+
concept_class_concept_id integer NOT NULL );
|
|
433
|
+
|
|
434
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
435
|
+
CREATE TABLE @cdmDatabaseSchema.CONCEPT_RELATIONSHIP (
|
|
436
|
+
concept_id_1 integer NOT NULL,
|
|
437
|
+
concept_id_2 integer NOT NULL,
|
|
438
|
+
relationship_id varchar(20) NOT NULL,
|
|
439
|
+
valid_start_date date NOT NULL,
|
|
440
|
+
valid_end_date date NOT NULL,
|
|
441
|
+
invalid_reason varchar(1) NULL );
|
|
442
|
+
|
|
443
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
444
|
+
CREATE TABLE @cdmDatabaseSchema.RELATIONSHIP (
|
|
445
|
+
relationship_id varchar(20) NOT NULL,
|
|
446
|
+
relationship_name varchar(255) NOT NULL,
|
|
447
|
+
is_hierarchical varchar(1) NOT NULL,
|
|
448
|
+
defines_ancestry varchar(1) NOT NULL,
|
|
449
|
+
reverse_relationship_id varchar(20) NOT NULL,
|
|
450
|
+
relationship_concept_id integer NOT NULL );
|
|
451
|
+
|
|
452
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
453
|
+
CREATE TABLE @cdmDatabaseSchema.CONCEPT_SYNONYM (
|
|
454
|
+
concept_id integer NOT NULL,
|
|
455
|
+
concept_synonym_name varchar(1000) NOT NULL,
|
|
456
|
+
language_concept_id integer NOT NULL );
|
|
457
|
+
|
|
458
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
459
|
+
CREATE TABLE @cdmDatabaseSchema.CONCEPT_ANCESTOR (
|
|
460
|
+
ancestor_concept_id integer NOT NULL,
|
|
461
|
+
descendant_concept_id integer NOT NULL,
|
|
462
|
+
min_levels_of_separation integer NOT NULL,
|
|
463
|
+
max_levels_of_separation integer NOT NULL );
|
|
464
|
+
|
|
465
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
466
|
+
CREATE TABLE @cdmDatabaseSchema.SOURCE_TO_CONCEPT_MAP (
|
|
467
|
+
source_code varchar(50) NOT NULL,
|
|
468
|
+
source_concept_id integer NOT NULL,
|
|
469
|
+
source_vocabulary_id varchar(20) NOT NULL,
|
|
470
|
+
source_code_description varchar(255) NULL,
|
|
471
|
+
target_concept_id integer NOT NULL,
|
|
472
|
+
target_vocabulary_id varchar(20) NOT NULL,
|
|
473
|
+
valid_start_date date NOT NULL,
|
|
474
|
+
valid_end_date date NOT NULL,
|
|
475
|
+
invalid_reason varchar(1) NULL );
|
|
476
|
+
|
|
477
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
478
|
+
CREATE TABLE @cdmDatabaseSchema.DRUG_STRENGTH (
|
|
479
|
+
drug_concept_id integer NOT NULL,
|
|
480
|
+
ingredient_concept_id integer NOT NULL,
|
|
481
|
+
amount_value NUMERIC NULL,
|
|
482
|
+
amount_unit_concept_id integer NULL,
|
|
483
|
+
numerator_value NUMERIC NULL,
|
|
484
|
+
numerator_unit_concept_id integer NULL,
|
|
485
|
+
denominator_value NUMERIC NULL,
|
|
486
|
+
denominator_unit_concept_id integer NULL,
|
|
487
|
+
box_size integer NULL,
|
|
488
|
+
valid_start_date date NOT NULL,
|
|
489
|
+
valid_end_date date NOT NULL,
|
|
490
|
+
invalid_reason varchar(1) NULL );
|
|
491
|
+
|
|
492
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
493
|
+
CREATE TABLE @cdmDatabaseSchema.COHORT_DEFINITION (
|
|
494
|
+
cohort_definition_id integer NOT NULL,
|
|
495
|
+
cohort_definition_name varchar(255) NOT NULL,
|
|
496
|
+
cohort_definition_description TEXT NULL,
|
|
497
|
+
definition_type_concept_id integer NOT NULL,
|
|
498
|
+
cohort_definition_syntax TEXT NULL,
|
|
499
|
+
subject_concept_id integer NOT NULL,
|
|
500
|
+
cohort_initiation_date date NULL );
|
|
501
|
+
|
|
502
|
+
--HINT DISTRIBUTE ON RANDOM
|
|
503
|
+
CREATE TABLE @cdmDatabaseSchema.ATTRIBUTE_DEFINITION (
|
|
504
|
+
attribute_definition_id integer NOT NULL,
|
|
505
|
+
attribute_name varchar(255) NOT NULL,
|
|
506
|
+
attribute_description TEXT NULL,
|
|
507
|
+
attribute_type_concept_id integer NOT NULL,
|
|
508
|
+
attribute_syntax TEXT NULL );
|
|
@@ -0,0 +1,61 @@
|
|
|
1
|
+
{
|
|
2
|
+
"datetime_linked_fields": {
|
|
3
|
+
"condition_occurrence": {
|
|
4
|
+
"condition_start_datetime": "condition_start_date",
|
|
5
|
+
"condition_end_datetime": "condition_end_date"
|
|
6
|
+
},
|
|
7
|
+
"death": {
|
|
8
|
+
"death_datetime": "death_date"
|
|
9
|
+
},
|
|
10
|
+
"drug_exposure": {
|
|
11
|
+
"drug_exposure_start_datetime": "drug_exposure_start_date",
|
|
12
|
+
"drug_exposure_end_datetime": "drug_exposure_end_date"
|
|
13
|
+
},
|
|
14
|
+
"measurement": {
|
|
15
|
+
"measurement_datetime": "measurement_date"
|
|
16
|
+
},
|
|
17
|
+
"observation": {
|
|
18
|
+
"observation_datetime": "observation_date"
|
|
19
|
+
},
|
|
20
|
+
"procedure_occurrence": {
|
|
21
|
+
"procedure_datetime": "procedure_date"
|
|
22
|
+
},
|
|
23
|
+
"specimen": {
|
|
24
|
+
"specimen_datetime": "specimen_date"
|
|
25
|
+
},
|
|
26
|
+
"visit_occurrence": {
|
|
27
|
+
"visit_start_datetime": "visit_start_date",
|
|
28
|
+
"visit_end_datetime": "visit_end_date"
|
|
29
|
+
}
|
|
30
|
+
},
|
|
31
|
+
"date_field_components": {
|
|
32
|
+
"person": {
|
|
33
|
+
"birth_datetime": {
|
|
34
|
+
"year":"year_of_birth",
|
|
35
|
+
"month":"month_of_birth",
|
|
36
|
+
"day":"day_of_birth"
|
|
37
|
+
}
|
|
38
|
+
}
|
|
39
|
+
},
|
|
40
|
+
"person_id_field": {
|
|
41
|
+
"condition_occurrence": "person_id",
|
|
42
|
+
"death": "person_id",
|
|
43
|
+
"drug_exposure": "person_id",
|
|
44
|
+
"measurement": "person_id",
|
|
45
|
+
"observation": "person_id",
|
|
46
|
+
"person": "person_id",
|
|
47
|
+
"procedure_occurrence": "person_id",
|
|
48
|
+
"specimen": "person_id",
|
|
49
|
+
"visit_occurrence": "person_id"
|
|
50
|
+
},
|
|
51
|
+
"auto_number_field": {
|
|
52
|
+
"condition_occurrence": "condition_occurrence_id",
|
|
53
|
+
"death": "death_id",
|
|
54
|
+
"drug_exposure": "drug_exposure_id",
|
|
55
|
+
"measurement": "measurement_id",
|
|
56
|
+
"observation": "observation_id",
|
|
57
|
+
"procedure_occurrence": "procedure_occurrence_id",
|
|
58
|
+
"specimen": "specimen_id",
|
|
59
|
+
"visit_occurrence": "visit_occurrence_id"
|
|
60
|
+
}
|
|
61
|
+
}
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
import os
|
|
2
|
+
import json
|
|
3
|
+
|
|
4
|
+
def load_json(f_in):
    """Load JSON from a file path or, failing that, from a JSON string.

    If ``f_in`` names an existing path, that file is opened and parsed as
    JSON. Otherwise ``f_in`` itself is parsed as a JSON document.

    Args:
        f_in: A filesystem path to a JSON file, or a string containing JSON.

    Returns:
        The decoded JSON value (typically a dict or list).

    Raises:
        FileNotFoundError: If ``f_in`` is not an existing path and cannot be
            parsed as JSON. The underlying parse error is attached as
            ``__cause__``.
        json.JSONDecodeError: If ``f_in`` is an existing file whose content
            is not valid JSON (this case is not wrapped).
    """
    if os.path.exists(f_in):
        # Use a context manager so the handle is closed even when parsing
        # fails, instead of relying on garbage collection.
        with open(f_in) as handle:
            return json.load(handle)

    try:
        return json.loads(f_in)
    except (TypeError, ValueError) as err:
        # json.JSONDecodeError subclasses ValueError; TypeError covers inputs
        # that are not str/bytes. Chain the cause so the real parse failure
        # stays visible in the traceback.
        raise FileNotFoundError(f"{f_in} not found. Or cannot parse as json") from err
|
|
14
|
+
|