carrot-transform: carrot_transform-0.3.4-py3-none-any.whl → carrot_transform-0.4.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of carrot-transform might be problematic. Click here for more details.

Files changed (33)
  1. {carrot_transform-0.3.4.dist-info → carrot_transform-0.4.0.dist-info}/METADATA +41 -18
  2. carrot_transform-0.4.0.dist-info/RECORD +41 -0
  3. {carrot_transform-0.3.4.dist-info → carrot_transform-0.4.0.dist-info}/WHEEL +1 -1
  4. carrot_transform-0.4.0.dist-info/entry_points.txt +2 -0
  5. carrottransform/__init__.py +1 -1
  6. carrottransform/_version.py +2 -2
  7. carrottransform/cli/command.py +9 -5
  8. carrottransform/cli/subcommands/run.py +302 -443
  9. carrottransform/cli/subcommands/run_v2.py +145 -0
  10. carrottransform/config/OMOPCDM_postgresql_5.4_ddl.sql +550 -0
  11. carrottransform/examples/test/rules/v1.json +280 -0
  12. carrottransform/examples/test/rules/v2.json +115 -0
  13. carrottransform/tools/__init__.py +4 -14
  14. carrottransform/tools/args.py +128 -0
  15. carrottransform/tools/click.py +21 -0
  16. carrottransform/tools/concept_helpers.py +61 -0
  17. carrottransform/tools/core.py +163 -0
  18. carrottransform/tools/date_helpers.py +79 -0
  19. carrottransform/tools/file_helpers.py +177 -7
  20. carrottransform/tools/logger.py +19 -0
  21. carrottransform/tools/mapping_types.py +32 -0
  22. carrottransform/tools/mappingrules.py +298 -32
  23. carrottransform/tools/metrics.py +274 -49
  24. carrottransform/tools/omopcdm.py +42 -32
  25. carrottransform/tools/orchestrator.py +381 -0
  26. carrottransform/tools/person_helpers.py +126 -0
  27. carrottransform/tools/record_builder.py +413 -0
  28. carrottransform/tools/stream_helpers.py +71 -0
  29. carrottransform/tools/types.py +71 -0
  30. carrottransform/tools/validation.py +62 -0
  31. carrot_transform-0.3.4.dist-info/RECORD +0 -24
  32. carrot_transform-0.3.4.dist-info/entry_points.txt +0 -3
  33. {carrot_transform-0.3.4.dist-info → carrot_transform-0.4.0.dist-info/licenses}/LICENSE +0 -0
@@ -0,0 +1,145 @@
1
+ """
2
+ Entry point for the v2 processing system
3
+ """
4
+
5
+ from pathlib import Path
6
+ from typing import Optional
7
+ import click
8
+ import time
9
+ from carrottransform.tools.click import PathArgs
10
+ from carrottransform.tools.file_helpers import (
11
+ check_dir_isvalid,
12
+ resolve_paths,
13
+ set_omop_filenames,
14
+ )
15
+ from carrottransform.tools.logger import logger_setup
16
+ from carrottransform.tools.orchestrator import V2ProcessingOrchestrator
17
+
18
+ logger = logger_setup()
19
+
20
+
21
+ @click.command()
22
+ @click.option(
23
+ "--rules-file",
24
+ type=PathArgs,
25
+ required=True,
26
+ help="v2 json file containing mapping rules",
27
+ )
28
+ @click.option(
29
+ "--output-dir",
30
+ type=PathArgs,
31
+ required=True,
32
+ help="define the output directory for OMOP-format tsv files",
33
+ )
34
+ @click.option(
35
+ "--write-mode",
36
+ default="w",
37
+ type=click.Choice(["w", "a"]),
38
+ help="force write-mode on output files",
39
+ )
40
+ @click.option(
41
+ "--person-file",
42
+ type=PathArgs,
43
+ required=True,
44
+ help="File containing person_ids in the first column",
45
+ )
46
+ @click.option(
47
+ "--omop-ddl-file",
48
+ type=PathArgs,
49
+ required=False,
50
+ help="File containing OHDSI ddl statements for OMOP tables",
51
+ )
52
+ @click.option(
53
+ "--omop-config-file",
54
+ type=PathArgs,
55
+ required=False,
56
+ help="File containing additional / override json config for omop outputs",
57
+ )
58
+ @click.option(
59
+ "--omop-version",
60
+ required=False,
61
+ help="Quoted string containing omop version - eg '5.3'",
62
+ )
63
+ @click.option("--input-dir", type=PathArgs, required=True, help="Input directories")
64
+ def mapstream_v2(
65
+ rules_file: Path,
66
+ output_dir: Path,
67
+ write_mode: str,
68
+ person_file: Path,
69
+ omop_ddl_file: Optional[Path],
70
+ omop_config_file: Optional[Path],
71
+ omop_version: Optional[str],
72
+ input_dir: Path,
73
+ ):
74
+ """Map to OMOP output using v2 format rules - Refactored Implementation"""
75
+
76
+ start_time = time.time()
77
+
78
+ try:
79
+ # Resolve paths
80
+ resolved_paths = resolve_paths(
81
+ [
82
+ rules_file,
83
+ output_dir,
84
+ person_file,
85
+ omop_ddl_file,
86
+ omop_config_file,
87
+ input_dir,
88
+ ]
89
+ )
90
+ [
91
+ rules_file,
92
+ output_dir,
93
+ person_file,
94
+ omop_ddl_file,
95
+ omop_config_file,
96
+ input_dir,
97
+ ] = resolved_paths # type: ignore
98
+
99
+ # Validate inputs
100
+ check_dir_isvalid(input_dir)
101
+ check_dir_isvalid(output_dir, create_if_missing=True)
102
+
103
+ # Set default OMOP file paths when not explicitly provided
104
+ omop_config_file, omop_ddl_file = set_omop_filenames(
105
+ omop_ddl_file, omop_config_file, omop_version
106
+ )
107
+
108
+ # Create orchestrator and execute processing
109
+ orchestrator = V2ProcessingOrchestrator(
110
+ rules_file=rules_file,
111
+ output_dir=output_dir,
112
+ input_dir=input_dir,
113
+ person_file=person_file,
114
+ omop_ddl_file=omop_ddl_file,
115
+ omop_config_file=omop_config_file,
116
+ write_mode=write_mode,
117
+ )
118
+
119
+ logger.info(
120
+ f"Loaded v2 mapping rules from: {rules_file} in {time.time() - start_time:.5f} secs"
121
+ )
122
+
123
+ result = orchestrator.execute_processing()
124
+
125
+ if result.success:
126
+ logger.info(
127
+ f"V2 processing completed successfully in {time.time() - start_time:.5f} secs"
128
+ )
129
+ else:
130
+ logger.error(f"V2 processing failed: {result.error_message}")
131
+
132
+ except Exception as e:
133
+ logger.error(f"V2 processing failed with error: {str(e)}")
134
+ raise
135
+
136
+
137
+ @click.group(help="V2 Commands for mapping data to the OMOP CommonDataModel (CDM).")
138
+ def run_v2():
139
+ pass
140
+
141
+
142
+ run_v2.add_command(mapstream_v2, "mapstream")
143
+
144
+ if __name__ == "__main__":
145
+ run_v2()
@@ -0,0 +1,550 @@
1
+ --postgresql CDM DDL Specification for OMOP Common Data Model 5.4
2
+
3
+ --HINT DISTRIBUTE ON KEY (person_id)
4
+ CREATE TABLE @cdmDatabaseSchema.PERSON (
5
+ person_id integer NOT NULL,
6
+ gender_concept_id integer NOT NULL,
7
+ year_of_birth integer NOT NULL,
8
+ month_of_birth integer NULL,
9
+ day_of_birth integer NULL,
10
+ birth_datetime TIMESTAMP NULL,
11
+ race_concept_id integer NOT NULL,
12
+ ethnicity_concept_id integer NOT NULL,
13
+ location_id integer NULL,
14
+ provider_id integer NULL,
15
+ care_site_id integer NULL,
16
+ person_source_value varchar(50) NULL,
17
+ gender_source_value varchar(50) NULL,
18
+ gender_source_concept_id integer NULL,
19
+ race_source_value varchar(50) NULL,
20
+ race_source_concept_id integer NULL,
21
+ ethnicity_source_value varchar(50) NULL,
22
+ ethnicity_source_concept_id integer NULL );
23
+
24
+ --HINT DISTRIBUTE ON KEY (person_id)
25
+ CREATE TABLE @cdmDatabaseSchema.OBSERVATION_PERIOD (
26
+ observation_period_id integer NOT NULL,
27
+ person_id integer NOT NULL,
28
+ observation_period_start_date date NOT NULL,
29
+ observation_period_end_date date NOT NULL,
30
+ period_type_concept_id integer NOT NULL );
31
+
32
+ --HINT DISTRIBUTE ON KEY (person_id)
33
+ CREATE TABLE @cdmDatabaseSchema.VISIT_OCCURRENCE (
34
+ visit_occurrence_id integer NOT NULL,
35
+ person_id integer NOT NULL,
36
+ visit_concept_id integer NOT NULL,
37
+ visit_start_date date NOT NULL,
38
+ visit_start_datetime TIMESTAMP NULL,
39
+ visit_end_date date NOT NULL,
40
+ visit_end_datetime TIMESTAMP NULL,
41
+ visit_type_concept_id Integer NOT NULL,
42
+ provider_id integer NULL,
43
+ care_site_id integer NULL,
44
+ visit_source_value varchar(50) NULL,
45
+ visit_source_concept_id integer NULL,
46
+ admitted_from_concept_id integer NULL,
47
+ admitted_from_source_value varchar(50) NULL,
48
+ discharged_to_concept_id integer NULL,
49
+ discharged_to_source_value varchar(50) NULL,
50
+ preceding_visit_occurrence_id integer NULL );
51
+
52
+ --HINT DISTRIBUTE ON KEY (person_id)
53
+ CREATE TABLE @cdmDatabaseSchema.VISIT_DETAIL (
54
+ visit_detail_id integer NOT NULL,
55
+ person_id integer NOT NULL,
56
+ visit_detail_concept_id integer NOT NULL,
57
+ visit_detail_start_date date NOT NULL,
58
+ visit_detail_start_datetime TIMESTAMP NULL,
59
+ visit_detail_end_date date NOT NULL,
60
+ visit_detail_end_datetime TIMESTAMP NULL,
61
+ visit_detail_type_concept_id integer NOT NULL,
62
+ provider_id integer NULL,
63
+ care_site_id integer NULL,
64
+ visit_detail_source_value varchar(50) NULL,
65
+ visit_detail_source_concept_id Integer NULL,
66
+ admitted_from_concept_id Integer NULL,
67
+ admitted_from_source_value varchar(50) NULL,
68
+ discharged_to_source_value varchar(50) NULL,
69
+ discharged_to_concept_id integer NULL,
70
+ preceding_visit_detail_id integer NULL,
71
+ parent_visit_detail_id integer NULL,
72
+ visit_occurrence_id integer NOT NULL );
73
+
74
+ --HINT DISTRIBUTE ON KEY (person_id)
75
+ CREATE TABLE @cdmDatabaseSchema.CONDITION_OCCURRENCE (
76
+ condition_occurrence_id integer NOT NULL,
77
+ person_id integer NOT NULL,
78
+ condition_concept_id integer NOT NULL,
79
+ condition_start_date date NOT NULL,
80
+ condition_start_datetime TIMESTAMP NULL,
81
+ condition_end_date date NULL,
82
+ condition_end_datetime TIMESTAMP NULL,
83
+ condition_type_concept_id integer NOT NULL,
84
+ condition_status_concept_id integer NULL,
85
+ stop_reason varchar(20) NULL,
86
+ provider_id integer NULL,
87
+ visit_occurrence_id integer NULL,
88
+ visit_detail_id integer NULL,
89
+ condition_source_value varchar(50) NULL,
90
+ condition_source_concept_id integer NULL,
91
+ condition_status_source_value varchar(50) NULL );
92
+
93
+ --HINT DISTRIBUTE ON KEY (person_id)
94
+ CREATE TABLE @cdmDatabaseSchema.DRUG_EXPOSURE (
95
+ drug_exposure_id integer NOT NULL,
96
+ person_id integer NOT NULL,
97
+ drug_concept_id integer NOT NULL,
98
+ drug_exposure_start_date date NOT NULL,
99
+ drug_exposure_start_datetime TIMESTAMP NULL,
100
+ drug_exposure_end_date date NOT NULL,
101
+ drug_exposure_end_datetime TIMESTAMP NULL,
102
+ verbatim_end_date date NULL,
103
+ drug_type_concept_id integer NOT NULL,
104
+ stop_reason varchar(20) NULL,
105
+ refills integer NULL,
106
+ quantity NUMERIC NULL,
107
+ days_supply integer NULL,
108
+ sig TEXT NULL,
109
+ route_concept_id integer NULL,
110
+ lot_number varchar(50) NULL,
111
+ provider_id integer NULL,
112
+ visit_occurrence_id integer NULL,
113
+ visit_detail_id integer NULL,
114
+ drug_source_value varchar(50) NULL,
115
+ drug_source_concept_id integer NULL,
116
+ route_source_value varchar(50) NULL,
117
+ dose_unit_source_value varchar(50) NULL );
118
+
119
+ --HINT DISTRIBUTE ON KEY (person_id)
120
+ CREATE TABLE @cdmDatabaseSchema.PROCEDURE_OCCURRENCE (
121
+ procedure_occurrence_id integer NOT NULL,
122
+ person_id integer NOT NULL,
123
+ procedure_concept_id integer NOT NULL,
124
+ procedure_date date NOT NULL,
125
+ procedure_datetime TIMESTAMP NULL,
126
+ procedure_end_date date NULL,
127
+ procedure_end_datetime TIMESTAMP NULL,
128
+ procedure_type_concept_id integer NOT NULL,
129
+ modifier_concept_id integer NULL,
130
+ quantity integer NULL,
131
+ provider_id integer NULL,
132
+ visit_occurrence_id integer NULL,
133
+ visit_detail_id integer NULL,
134
+ procedure_source_value varchar(50) NULL,
135
+ procedure_source_concept_id integer NULL,
136
+ modifier_source_value varchar(50) NULL );
137
+
138
+ --HINT DISTRIBUTE ON KEY (person_id)
139
+ CREATE TABLE @cdmDatabaseSchema.DEVICE_EXPOSURE (
140
+ device_exposure_id integer NOT NULL,
141
+ person_id integer NOT NULL,
142
+ device_concept_id integer NOT NULL,
143
+ device_exposure_start_date date NOT NULL,
144
+ device_exposure_start_datetime TIMESTAMP NULL,
145
+ device_exposure_end_date date NULL,
146
+ device_exposure_end_datetime TIMESTAMP NULL,
147
+ device_type_concept_id integer NOT NULL,
148
+ unique_device_id varchar(255) NULL,
149
+ production_id varchar(255) NULL,
150
+ quantity integer NULL,
151
+ provider_id integer NULL,
152
+ visit_occurrence_id integer NULL,
153
+ visit_detail_id integer NULL,
154
+ device_source_value varchar(50) NULL,
155
+ device_source_concept_id integer NULL,
156
+ unit_concept_id integer NULL,
157
+ unit_source_value varchar(50) NULL,
158
+ unit_source_concept_id integer NULL );
159
+
160
+ --HINT DISTRIBUTE ON KEY (person_id)
161
+ CREATE TABLE @cdmDatabaseSchema.MEASUREMENT (
162
+ measurement_id integer NOT NULL,
163
+ person_id integer NOT NULL,
164
+ measurement_concept_id integer NOT NULL,
165
+ measurement_date date NOT NULL,
166
+ measurement_datetime TIMESTAMP NULL,
167
+ measurement_time varchar(10) NULL,
168
+ measurement_type_concept_id integer NOT NULL,
169
+ operator_concept_id integer NULL,
170
+ value_as_number NUMERIC NULL,
171
+ value_as_concept_id integer NULL,
172
+ unit_concept_id integer NULL,
173
+ range_low NUMERIC NULL,
174
+ range_high NUMERIC NULL,
175
+ provider_id integer NULL,
176
+ visit_occurrence_id integer NULL,
177
+ visit_detail_id integer NULL,
178
+ measurement_source_value varchar(50) NULL,
179
+ measurement_source_concept_id integer NULL,
180
+ unit_source_value varchar(50) NULL,
181
+ unit_source_concept_id integer NULL,
182
+ value_source_value varchar(50) NULL,
183
+ measurement_event_id bigint NULL,
184
+ meas_event_field_concept_id integer NULL );
185
+
186
+ --HINT DISTRIBUTE ON KEY (person_id)
187
+ CREATE TABLE @cdmDatabaseSchema.OBSERVATION (
188
+ observation_id integer NOT NULL,
189
+ person_id integer NOT NULL,
190
+ observation_concept_id integer NOT NULL,
191
+ observation_date date NOT NULL,
192
+ observation_datetime TIMESTAMP NULL,
193
+ observation_type_concept_id integer NOT NULL,
194
+ value_as_number NUMERIC NULL,
195
+ value_as_string varchar(60) NULL,
196
+ value_as_concept_id Integer NULL,
197
+ qualifier_concept_id integer NULL,
198
+ unit_concept_id integer NULL,
199
+ provider_id integer NULL,
200
+ visit_occurrence_id integer NULL,
201
+ visit_detail_id integer NULL,
202
+ observation_source_value varchar(50) NULL,
203
+ observation_source_concept_id integer NULL,
204
+ unit_source_value varchar(50) NULL,
205
+ qualifier_source_value varchar(50) NULL,
206
+ value_source_value varchar(50) NULL,
207
+ observation_event_id bigint NULL,
208
+ obs_event_field_concept_id integer NULL );
209
+
210
+ --HINT DISTRIBUTE ON KEY (person_id)
211
+ CREATE TABLE @cdmDatabaseSchema.DEATH (
212
+ person_id integer NOT NULL,
213
+ death_date date NOT NULL,
214
+ death_datetime TIMESTAMP NULL,
215
+ death_type_concept_id integer NULL,
216
+ cause_concept_id integer NULL,
217
+ cause_source_value varchar(50) NULL,
218
+ cause_source_concept_id integer NULL );
219
+
220
+ --HINT DISTRIBUTE ON KEY (person_id)
221
+ CREATE TABLE @cdmDatabaseSchema.NOTE (
222
+ note_id integer NOT NULL,
223
+ person_id integer NOT NULL,
224
+ note_date date NOT NULL,
225
+ note_datetime TIMESTAMP NULL,
226
+ note_type_concept_id integer NOT NULL,
227
+ note_class_concept_id integer NOT NULL,
228
+ note_title varchar(250) NULL,
229
+ note_text TEXT NOT NULL,
230
+ encoding_concept_id integer NOT NULL,
231
+ language_concept_id integer NOT NULL,
232
+ provider_id integer NULL,
233
+ visit_occurrence_id integer NULL,
234
+ visit_detail_id integer NULL,
235
+ note_source_value varchar(50) NULL,
236
+ note_event_id bigint NULL,
237
+ note_event_field_concept_id integer NULL );
238
+
239
+ --HINT DISTRIBUTE ON RANDOM
240
+ CREATE TABLE @cdmDatabaseSchema.NOTE_NLP (
241
+ note_nlp_id integer NOT NULL,
242
+ note_id integer NOT NULL,
243
+ section_concept_id integer NULL,
244
+ snippet varchar(250) NULL,
245
+ "offset" varchar(50) NULL,
246
+ lexical_variant varchar(250) NOT NULL,
247
+ note_nlp_concept_id integer NULL,
248
+ note_nlp_source_concept_id integer NULL,
249
+ nlp_system varchar(250) NULL,
250
+ nlp_date date NOT NULL,
251
+ nlp_datetime TIMESTAMP NULL,
252
+ term_exists varchar(1) NULL,
253
+ term_temporal varchar(50) NULL,
254
+ term_modifiers varchar(2000) NULL );
255
+
256
+ --HINT DISTRIBUTE ON KEY (person_id)
257
+ CREATE TABLE @cdmDatabaseSchema.SPECIMEN (
258
+ specimen_id integer NOT NULL,
259
+ person_id integer NOT NULL,
260
+ specimen_concept_id integer NOT NULL,
261
+ specimen_type_concept_id integer NOT NULL,
262
+ specimen_date date NOT NULL,
263
+ specimen_datetime TIMESTAMP NULL,
264
+ quantity NUMERIC NULL,
265
+ unit_concept_id integer NULL,
266
+ anatomic_site_concept_id integer NULL,
267
+ disease_status_concept_id integer NULL,
268
+ specimen_source_id varchar(50) NULL,
269
+ specimen_source_value varchar(50) NULL,
270
+ unit_source_value varchar(50) NULL,
271
+ anatomic_site_source_value varchar(50) NULL,
272
+ disease_status_source_value varchar(50) NULL );
273
+
274
+ --HINT DISTRIBUTE ON RANDOM
275
+ CREATE TABLE @cdmDatabaseSchema.FACT_RELATIONSHIP (
276
+ domain_concept_id_1 integer NOT NULL,
277
+ fact_id_1 integer NOT NULL,
278
+ domain_concept_id_2 integer NOT NULL,
279
+ fact_id_2 integer NOT NULL,
280
+ relationship_concept_id integer NOT NULL );
281
+
282
+ --HINT DISTRIBUTE ON RANDOM
283
+ CREATE TABLE @cdmDatabaseSchema.LOCATION (
284
+ location_id integer NOT NULL,
285
+ address_1 varchar(50) NULL,
286
+ address_2 varchar(50) NULL,
287
+ city varchar(50) NULL,
288
+ state varchar(2) NULL,
289
+ zip varchar(9) NULL,
290
+ county varchar(20) NULL,
291
+ location_source_value varchar(50) NULL,
292
+ country_concept_id integer NULL,
293
+ country_source_value varchar(80) NULL,
294
+ latitude NUMERIC NULL,
295
+ longitude NUMERIC NULL );
296
+
297
+ --HINT DISTRIBUTE ON RANDOM
298
+ CREATE TABLE @cdmDatabaseSchema.CARE_SITE (
299
+ care_site_id integer NOT NULL,
300
+ care_site_name varchar(255) NULL,
301
+ place_of_service_concept_id integer NULL,
302
+ location_id integer NULL,
303
+ care_site_source_value varchar(50) NULL,
304
+ place_of_service_source_value varchar(50) NULL );
305
+
306
+ --HINT DISTRIBUTE ON RANDOM
307
+ CREATE TABLE @cdmDatabaseSchema.PROVIDER (
308
+ provider_id integer NOT NULL,
309
+ provider_name varchar(255) NULL,
310
+ npi varchar(20) NULL,
311
+ dea varchar(20) NULL,
312
+ specialty_concept_id integer NULL,
313
+ care_site_id integer NULL,
314
+ year_of_birth integer NULL,
315
+ gender_concept_id integer NULL,
316
+ provider_source_value varchar(50) NULL,
317
+ specialty_source_value varchar(50) NULL,
318
+ specialty_source_concept_id integer NULL,
319
+ gender_source_value varchar(50) NULL,
320
+ gender_source_concept_id integer NULL );
321
+
322
+ --HINT DISTRIBUTE ON KEY (person_id)
323
+ CREATE TABLE @cdmDatabaseSchema.PAYER_PLAN_PERIOD (
324
+ payer_plan_period_id integer NOT NULL,
325
+ person_id integer NOT NULL,
326
+ payer_plan_period_start_date date NOT NULL,
327
+ payer_plan_period_end_date date NOT NULL,
328
+ payer_concept_id integer NULL,
329
+ payer_source_value varchar(50) NULL,
330
+ payer_source_concept_id integer NULL,
331
+ plan_concept_id integer NULL,
332
+ plan_source_value varchar(50) NULL,
333
+ plan_source_concept_id integer NULL,
334
+ sponsor_concept_id integer NULL,
335
+ sponsor_source_value varchar(50) NULL,
336
+ sponsor_source_concept_id integer NULL,
337
+ family_source_value varchar(50) NULL,
338
+ stop_reason_concept_id integer NULL,
339
+ stop_reason_source_value varchar(50) NULL,
340
+ stop_reason_source_concept_id integer NULL );
341
+
342
+ --HINT DISTRIBUTE ON RANDOM
343
+ CREATE TABLE @cdmDatabaseSchema.COST (
344
+ cost_id integer NOT NULL,
345
+ cost_event_id integer NOT NULL,
346
+ cost_domain_id varchar(20) NOT NULL,
347
+ cost_type_concept_id integer NOT NULL,
348
+ currency_concept_id integer NULL,
349
+ total_charge NUMERIC NULL,
350
+ total_cost NUMERIC NULL,
351
+ total_paid NUMERIC NULL,
352
+ paid_by_payer NUMERIC NULL,
353
+ paid_by_patient NUMERIC NULL,
354
+ paid_patient_copay NUMERIC NULL,
355
+ paid_patient_coinsurance NUMERIC NULL,
356
+ paid_patient_deductible NUMERIC NULL,
357
+ paid_by_primary NUMERIC NULL,
358
+ paid_ingredient_cost NUMERIC NULL,
359
+ paid_dispensing_fee NUMERIC NULL,
360
+ payer_plan_period_id integer NULL,
361
+ amount_allowed NUMERIC NULL,
362
+ revenue_code_concept_id integer NULL,
363
+ revenue_code_source_value varchar(50) NULL,
364
+ drg_concept_id integer NULL,
365
+ drg_source_value varchar(3) NULL );
366
+
367
+ --HINT DISTRIBUTE ON KEY (person_id)
368
+ CREATE TABLE @cdmDatabaseSchema.DRUG_ERA (
369
+ drug_era_id integer NOT NULL,
370
+ person_id integer NOT NULL,
371
+ drug_concept_id integer NOT NULL,
372
+ drug_era_start_date TIMESTAMP NOT NULL,
373
+ drug_era_end_date TIMESTAMP NOT NULL,
374
+ drug_exposure_count integer NULL,
375
+ gap_days integer NULL );
376
+
377
+ --HINT DISTRIBUTE ON KEY (person_id)
378
+ CREATE TABLE @cdmDatabaseSchema.DOSE_ERA (
379
+ dose_era_id integer NOT NULL,
380
+ person_id integer NOT NULL,
381
+ drug_concept_id integer NOT NULL,
382
+ unit_concept_id integer NOT NULL,
383
+ dose_value NUMERIC NOT NULL,
384
+ dose_era_start_date TIMESTAMP NOT NULL,
385
+ dose_era_end_date TIMESTAMP NOT NULL );
386
+
387
+ --HINT DISTRIBUTE ON KEY (person_id)
388
+ CREATE TABLE @cdmDatabaseSchema.CONDITION_ERA (
389
+ condition_era_id integer NOT NULL,
390
+ person_id integer NOT NULL,
391
+ condition_concept_id integer NOT NULL,
392
+ condition_era_start_date TIMESTAMP NOT NULL,
393
+ condition_era_end_date TIMESTAMP NOT NULL,
394
+ condition_occurrence_count integer NULL );
395
+
396
+ --HINT DISTRIBUTE ON KEY (person_id)
397
+ CREATE TABLE @cdmDatabaseSchema.EPISODE (
398
+ episode_id bigint NOT NULL,
399
+ person_id bigint NOT NULL,
400
+ episode_concept_id integer NOT NULL,
401
+ episode_start_date date NOT NULL,
402
+ episode_start_datetime TIMESTAMP NULL,
403
+ episode_end_date date NULL,
404
+ episode_end_datetime TIMESTAMP NULL,
405
+ episode_parent_id bigint NULL,
406
+ episode_number integer NULL,
407
+ episode_object_concept_id integer NOT NULL,
408
+ episode_type_concept_id integer NOT NULL,
409
+ episode_source_value varchar(50) NULL,
410
+ episode_source_concept_id integer NULL );
411
+
412
+ --HINT DISTRIBUTE ON RANDOM
413
+ CREATE TABLE @cdmDatabaseSchema.EPISODE_EVENT (
414
+ episode_id bigint NOT NULL,
415
+ event_id bigint NOT NULL,
416
+ episode_event_field_concept_id integer NOT NULL );
417
+
418
+ --HINT DISTRIBUTE ON RANDOM
419
+ CREATE TABLE @cdmDatabaseSchema.METADATA (
420
+ metadata_id integer NOT NULL,
421
+ metadata_concept_id integer NOT NULL,
422
+ metadata_type_concept_id integer NOT NULL,
423
+ name varchar(250) NOT NULL,
424
+ value_as_string varchar(250) NULL,
425
+ value_as_concept_id integer NULL,
426
+ value_as_number NUMERIC NULL,
427
+ metadata_date date NULL,
428
+ metadata_datetime TIMESTAMP NULL );
429
+
430
+ --HINT DISTRIBUTE ON RANDOM
431
+ CREATE TABLE @cdmDatabaseSchema.CDM_SOURCE (
432
+ cdm_source_name varchar(255) NOT NULL,
433
+ cdm_source_abbreviation varchar(25) NOT NULL,
434
+ cdm_holder varchar(255) NOT NULL,
435
+ source_description TEXT NULL,
436
+ source_documentation_reference varchar(255) NULL,
437
+ cdm_etl_reference varchar(255) NULL,
438
+ source_release_date date NOT NULL,
439
+ cdm_release_date date NOT NULL,
440
+ cdm_version varchar(10) NULL,
441
+ cdm_version_concept_id integer NOT NULL,
442
+ vocabulary_version varchar(20) NOT NULL );
443
+
444
+ --HINT DISTRIBUTE ON RANDOM
445
+ CREATE TABLE @cdmDatabaseSchema.CONCEPT (
446
+ concept_id integer NOT NULL,
447
+ concept_name varchar(255) NOT NULL,
448
+ domain_id varchar(20) NOT NULL,
449
+ vocabulary_id varchar(20) NOT NULL,
450
+ concept_class_id varchar(20) NOT NULL,
451
+ standard_concept varchar(1) NULL,
452
+ concept_code varchar(50) NOT NULL,
453
+ valid_start_date date NOT NULL,
454
+ valid_end_date date NOT NULL,
455
+ invalid_reason varchar(1) NULL );
456
+
457
+ --HINT DISTRIBUTE ON RANDOM
458
+ CREATE TABLE @cdmDatabaseSchema.VOCABULARY (
459
+ vocabulary_id varchar(20) NOT NULL,
460
+ vocabulary_name varchar(255) NOT NULL,
461
+ vocabulary_reference varchar(255) NULL,
462
+ vocabulary_version varchar(255) NULL,
463
+ vocabulary_concept_id integer NOT NULL );
464
+
465
+ --HINT DISTRIBUTE ON RANDOM
466
+ CREATE TABLE @cdmDatabaseSchema.DOMAIN (
467
+ domain_id varchar(20) NOT NULL,
468
+ domain_name varchar(255) NOT NULL,
469
+ domain_concept_id integer NOT NULL );
470
+
471
+ --HINT DISTRIBUTE ON RANDOM
472
+ CREATE TABLE @cdmDatabaseSchema.CONCEPT_CLASS (
473
+ concept_class_id varchar(20) NOT NULL,
474
+ concept_class_name varchar(255) NOT NULL,
475
+ concept_class_concept_id integer NOT NULL );
476
+
477
+ --HINT DISTRIBUTE ON RANDOM
478
+ CREATE TABLE @cdmDatabaseSchema.CONCEPT_RELATIONSHIP (
479
+ concept_id_1 integer NOT NULL,
480
+ concept_id_2 integer NOT NULL,
481
+ relationship_id varchar(20) NOT NULL,
482
+ valid_start_date date NOT NULL,
483
+ valid_end_date date NOT NULL,
484
+ invalid_reason varchar(1) NULL );
485
+
486
+ --HINT DISTRIBUTE ON RANDOM
487
+ CREATE TABLE @cdmDatabaseSchema.RELATIONSHIP (
488
+ relationship_id varchar(20) NOT NULL,
489
+ relationship_name varchar(255) NOT NULL,
490
+ is_hierarchical varchar(1) NOT NULL,
491
+ defines_ancestry varchar(1) NOT NULL,
492
+ reverse_relationship_id varchar(20) NOT NULL,
493
+ relationship_concept_id integer NOT NULL );
494
+
495
+ --HINT DISTRIBUTE ON RANDOM
496
+ CREATE TABLE @cdmDatabaseSchema.CONCEPT_SYNONYM (
497
+ concept_id integer NOT NULL,
498
+ concept_synonym_name varchar(1000) NOT NULL,
499
+ language_concept_id integer NOT NULL );
500
+
501
+ --HINT DISTRIBUTE ON RANDOM
502
+ CREATE TABLE @cdmDatabaseSchema.CONCEPT_ANCESTOR (
503
+ ancestor_concept_id integer NOT NULL,
504
+ descendant_concept_id integer NOT NULL,
505
+ min_levels_of_separation integer NOT NULL,
506
+ max_levels_of_separation integer NOT NULL );
507
+
508
+ --HINT DISTRIBUTE ON RANDOM
509
+ CREATE TABLE @cdmDatabaseSchema.SOURCE_TO_CONCEPT_MAP (
510
+ source_code varchar(50) NOT NULL,
511
+ source_concept_id integer NOT NULL,
512
+ source_vocabulary_id varchar(20) NOT NULL,
513
+ source_code_description varchar(255) NULL,
514
+ target_concept_id integer NOT NULL,
515
+ target_vocabulary_id varchar(20) NOT NULL,
516
+ valid_start_date date NOT NULL,
517
+ valid_end_date date NOT NULL,
518
+ invalid_reason varchar(1) NULL );
519
+
520
+ --HINT DISTRIBUTE ON RANDOM
521
+ CREATE TABLE @cdmDatabaseSchema.DRUG_STRENGTH (
522
+ drug_concept_id integer NOT NULL,
523
+ ingredient_concept_id integer NOT NULL,
524
+ amount_value NUMERIC NULL,
525
+ amount_unit_concept_id integer NULL,
526
+ numerator_value NUMERIC NULL,
527
+ numerator_unit_concept_id integer NULL,
528
+ denominator_value NUMERIC NULL,
529
+ denominator_unit_concept_id integer NULL,
530
+ box_size integer NULL,
531
+ valid_start_date date NOT NULL,
532
+ valid_end_date date NOT NULL,
533
+ invalid_reason varchar(1) NULL );
534
+
535
+ --HINT DISTRIBUTE ON RANDOM
536
+ CREATE TABLE @cdmDatabaseSchema.COHORT (
537
+ cohort_definition_id integer NOT NULL,
538
+ subject_id integer NOT NULL,
539
+ cohort_start_date date NOT NULL,
540
+ cohort_end_date date NOT NULL );
541
+
542
+ --HINT DISTRIBUTE ON RANDOM
543
+ CREATE TABLE @cdmDatabaseSchema.COHORT_DEFINITION (
544
+ cohort_definition_id integer NOT NULL,
545
+ cohort_definition_name varchar(255) NOT NULL,
546
+ cohort_definition_description TEXT NULL,
547
+ definition_type_concept_id integer NOT NULL,
548
+ cohort_definition_syntax TEXT NULL,
549
+ subject_concept_id integer NOT NULL,
550
+ cohort_initiation_date date NULL );