# etlMapping.yaml
mappings:
# Mapping entry for doc_type `subject` (type: aggregator, root: subject).
# NOTE(review): nesting was restored from a copy that had lost its
# indentation; verify the structure against the consumer's schema.
- name: gen3.biodatacatalyst.nhlbi.nih.gov_subject
  doc_type: subject
  type: aggregator
  root: subject
  # Properties listed by name only (no path, src or fn).
  props:
  - name: submitter_id
  - name: project_id
  - name: consent_codes
  - name: geographic_site
  # Properties grouped by `path`; each entry carries its own `props` list.
  flatten_props:
  - path: demographics
    props:
    - name: age_at_index
    - name: hispanic_subgroup
    - name: subcohort
    - name: weight_baseline
    - name: bmi_baseline
    - name: height_baseline
  - path: medical_histories
    props:
    - name: diabetes
    - name: hypertension
    - name: cerebrovascular_disease
    - name: chronic_respiratory_disease
    - name: coronary_artery_disease
    - name: asthma
    - name: cabg_presence
    - name: copd
    - name: emphysema
    - name: heart_failure
    - name: myocardial_infarction
    - name: stroke
    - name: cac_score
    - name: cac_volume
    - name: carotid_plaque
    - name: carotid_stenosis
    - name: cimt_1
    - name: cimt_2
    - name: vte_case_status
    - name: vte_followup_start_age
    - name: vte_prior_history
  - path: medication_records
    props:
    - name: hypertension_meds
    - name: antihypertensive_meds
    - name: fasting_lipids
    - name: lipid_lowering_medication
  - path: lab_results
    props:
    - name: lymphocyte_ncnc_bld
    - name: mch_entmass_rbc
    - name: mcv_entvol_rbc
    - name: mchc_mcnc_rbc
    - name: monocyte_ncnc_bld
    - name: neutrophil_ncnc_bld
    - name: pmv_entvol_bld
    - name: rbc_ncnc_bld
    - name: rdw_ratio_rbc
    - name: hemoglobin_mcnc_bld
    - name: platelet_ncnc_bld
    - name: hematocrit_vfr_bld
    - name: wbc_ncnc_bld
    - name: basophil_ncnc_bld
    - name: eosinophil_ncnc_bld
    - name: unit_triglycerides
    - name: hdl
    - name: ldl
    - name: triglycerides
    - name: total_cholesterol
  # Each entry names an output field, a `path` and an `fn` (set or count).
  # The `set` entries also name a `src` property; the `count` entries do not.
  aggregated_props:
  - name: annotated_sex
    path: demographics
    src: annotated_sex
    fn: set
  - name: race
    path: demographics
    src: race
    fn: set
  - name: ethnicity
    path: demographics
    src: ethnicity
    fn: set
  - name: _samples_count
    path: samples
    fn: count
  - name: _aliquots_count
    path: samples.aliquots
    fn: count
  - name: _read_groups_count
    path: samples.aliquots.read_groups
    fn: count
  - name: _submitted_unaligned_reads_files_count
    path: samples.aliquots.read_groups.submitted_unaligned_reads_files
    fn: count
  - name: _submitted_aligned_reads_files_count
    path: samples.aliquots.read_groups.submitted_aligned_reads_files
    fn: count
  - name: _simple_germline_variations_count
    path: samples.aliquots.read_groups.simple_germline_variations
    fn: count
  - name: current_smoker_baseline
    path: exposures
    src: current_smoker_baseline
    fn: set
  - name: ever_smoker_baseline
    path: exposures
    src: ever_smoker_baseline
    fn: set
  # Dotted paths with bracketed property lists per segment.
  # NOTE(review): `a:b` inside brackets presumably exposes property `b`
  # under the name `a` — confirm against the consumer's documentation.
  parent_props:
  - path: studies[studies_submitter_id:submitter_id].projects[code]
  - path: studies[studies_submitter_id:submitter_id].projects[code].programs[programs_name:name]
  # Properties taken from the `file` index, joined on `_subject_id`.
  joining_props:
  - index: file
    join_on: _subject_id
    props:
    - name: data_format
      src: data_format
      fn: set
    - name: data_type
      src: data_type
      fn: set
    - name: file_count
      src: _file_id
      fn: count
# Mapping entry for doc_type `file` (type: collector, category: data_file).
# NOTE(review): nesting was restored from a copy that had lost its
# indentation; verify the structure against the consumer's schema.
- name: gen3.biodatacatalyst.nhlbi.nih.gov_file
  doc_type: file
  type: collector
  # Plain `None` is a YAML string, not null (null is spelled `null` or `~`).
  # NOTE(review): presumably tells the consumer there is no root node — confirm.
  root: None
  category: data_file
  # Properties listed by name only (no src or fn).
  props:
  - name: object_id
  - name: md5sum
  - name: file_name
  - name: file_size
  - name: data_category
  - name: data_format
  - name: data_type
  - name: state
  - name: callset
  - name: bucket_path
  - name: source_node
  # Keyed by `subject` and `program`; each key holds its own `props` list.
  injecting_props:
    subject:
      props:
      - name: _subject_id
        src: id
        fn: set
      - name: project_id
    program:
      props:
      - name: programs_name
        src: name
        fn: set