-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathcbio_database_views.sql
179 lines (169 loc) · 8.87 KB
/
cbio_database_views.sql
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
# sample
CREATE VIEW view_sample AS
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', sample.STABLE_ID) as sample_unique_id,
sample.STABLE_ID as sample_stable_id,
concat(cs.CANCER_STUDY_IDENTIFIER, '_', p.STABLE_ID) as patient_unique_id,
p.STABLE_ID as patient_stable_id,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier
FROM sample
INNER JOIN patient p on sample.PATIENT_ID = p.INTERNAL_ID
INNER JOIN cancer_study cs on p.CANCER_STUDY_ID = cs.CANCER_STUDY_ID;
# sample list
CREATE VIEW view_sample_list AS
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', s.STABLE_ID) as sample_unique_id,
sl.STABLE_ID as sample_list_stable_id,
sl.NAME as name,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier
FROM sample_list as sl
INNER JOIN sample_list_list as sll ON sll.LIST_ID = sl.LIST_ID
INNER JOIN sample as s ON s.INTERNAL_ID = sll.SAMPLE_ID
INNER JOIN cancer_study cs on sl.CANCER_STUDY_ID = cs.CANCER_STUDY_ID;
# genomic_event - mutation
CREATE VIEW view_genomic_event_mutation AS
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', sample.STABLE_ID) as sample_unique_id,
gene.HUGO_GENE_SYMBOL as hugo_gene_symbol,
me.PROTEIN_CHANGE as variant,
gp.STABLE_ID as gene_panel_stable_id,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier,
g.STABLE_ID as genetic_profile_stable_id
FROM mutation
LEFT JOIN mutation_event as me ON mutation.MUTATION_EVENT_ID = me.MUTATION_EVENT_ID
LEFT JOIN sample_profile sp on mutation.SAMPLE_ID = sp.SAMPLE_ID and mutation.GENETIC_PROFILE_ID = sp.GENETIC_PROFILE_ID
LEFT JOIN gene_panel gp on sp.PANEL_ID = gp.INTERNAL_ID
LEFT JOIN genetic_profile g on sp.GENETIC_PROFILE_ID = g.GENETIC_PROFILE_ID
LEFT JOIN cancer_study cs on g.CANCER_STUDY_ID = cs.CANCER_STUDY_ID
LEFT JOIN sample on mutation.SAMPLE_ID = sample.INTERNAL_ID
LEFT JOIN gene ON mutation.ENTREZ_GENE_ID = gene.ENTREZ_GENE_ID;
# genomic_event - CNA
CREATE VIEW view_genomic_event_cna AS
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', sample.STABLE_ID) as sample_unique_id,
gene.HUGO_GENE_SYMBOL as hugo_gene_symbol,
convert(ce.ALTERATION, char) as variant,
gene_panel.STABLE_ID as gene_panel_stable_id,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier,
gp.STABLE_ID as genetic_profile_stable_id
FROM sample_cna_event
LEFT JOIN cna_event ce on sample_cna_event.CNA_EVENT_ID = ce.CNA_EVENT_ID
LEFT JOIN gene on ce.ENTREZ_GENE_ID = gene.ENTREZ_GENE_ID
LEFT JOIN genetic_profile gp on sample_cna_event.GENETIC_PROFILE_ID = gp.GENETIC_PROFILE_ID
LEFT JOIN sample_profile sp on gp.GENETIC_PROFILE_ID = sp.GENETIC_PROFILE_ID
LEFT JOIN cancer_study cs on gp.CANCER_STUDY_ID = cs.CANCER_STUDY_ID
LEFT JOIN sample on sample_cna_event.SAMPLE_ID = sample.INTERNAL_ID
LEFT JOIN gene_panel ON sp.PANEL_ID = gene_panel.INTERNAL_ID;
# genomic_event - SV - Beware SVs are added as two events.
CREATE VIEW view_genomic_event_struct_var AS
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', s.STABLE_ID) as sample_unique_id,
hugo_gene_symbol,
Event_Info as variant,
g.STABLE_ID as gene_panel_stable_id,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier,
gp.STABLE_ID as genetic_profile_stable_id
FROM structural_variant as sv
LEFT JOIN (SELECT ENTREZ_GENE_ID, HUGO_GENE_SYMBOL as hugo_gene_symbol FROM gene) gene1 on gene1.ENTREZ_GENE_ID = sv.SITE1_ENTREZ_GENE_ID
LEFT OUTER JOIN genetic_profile gp on gp.GENETIC_PROFILE_ID = sv.GENETIC_PROFILE_ID
LEFT JOIN sample s on sv.SAMPLE_ID = s.INTERNAL_ID
LEFT JOIN cancer_study cs on gp.CANCER_STUDY_ID = cs.CANCER_STUDY_ID
LEFT JOIN sample_profile sp on gp.GENETIC_PROFILE_ID = sp.GENETIC_PROFILE_ID
LEFT JOIN gene_panel g on sp.PANEL_ID = g.INTERNAL_ID
UNION ALL
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', s.STABLE_ID) as sample_unique_id,
hugo_gene_symbol,
Event_Info as variant,
g.STABLE_ID as gene_panel_stable_id,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier,
gp.STABLE_ID as genetic_profile_stable_id
FROM structural_variant as sv
LEFT JOIN (SELECT ENTREZ_GENE_ID, HUGO_GENE_SYMBOL as hugo_gene_symbol FROM gene) gene2 on gene2.ENTREZ_GENE_ID = sv.SITE2_ENTREZ_GENE_ID
LEFT OUTER JOIN genetic_profile gp on gp.GENETIC_PROFILE_ID = sv.GENETIC_PROFILE_ID
LEFT JOIN sample s on sv.SAMPLE_ID = s.INTERNAL_ID
LEFT JOIN cancer_study cs on gp.CANCER_STUDY_ID = cs.CANCER_STUDY_ID
LEFT JOIN sample_profile sp on gp.GENETIC_PROFILE_ID = sp.GENETIC_PROFILE_ID
LEFT JOIN gene_panel g on sp.PANEL_ID = g.INTERNAL_ID;
-- structural variant
CREATE VIEW view_structural_variant AS
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', s.STABLE_ID) as sample_unique_id,
gene1.HUGO_GENE_SYMBOL as hugo_symbol_gene1,
gene2.HUGO_GENE_SYMBOL as hugo_symbol_gene2,
g.STABLE_ID as gene_panel_stable_id,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier,
gp.STABLE_ID as genetic_profile_stable_id
FROM structural_variant as sv
LEFT JOIN (SELECT ENTREZ_GENE_ID, HUGO_GENE_SYMBOL FROM gene) gene1 on gene1.ENTREZ_GENE_ID = sv.SITE1_ENTREZ_GENE_ID
LEFT JOIN (SELECT ENTREZ_GENE_ID, HUGO_GENE_SYMBOL FROM gene) gene2 on gene2.ENTREZ_GENE_ID = sv.SITE2_ENTREZ_GENE_ID
LEFT OUTER JOIN genetic_profile gp on gp.GENETIC_PROFILE_ID = sv.GENETIC_PROFILE_ID
LEFT JOIN sample s on sv.SAMPLE_ID = s.INTERNAL_ID
LEFT JOIN cancer_study cs on gp.CANCER_STUDY_ID = cs.CANCER_STUDY_ID
LEFT JOIN sample_profile sp on gp.GENETIC_PROFILE_ID = sp.GENETIC_PROFILE_ID
LEFT JOIN gene_panel g on sp.PANEL_ID = g.INTERNAL_ID;
# CNA
CREATE VIEW view_cna AS
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', sample.STABLE_ID) as sample_unique_id,
gene.HUGO_GENE_SYMBOL as hugo_gene_symbol,
ce.ALTERATION as alteration,
gene_panel.STABLE_ID as gene_panel_stable_id,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier,
gp.STABLE_ID as genetic_profile_stable_id
FROM sample_cna_event
LEFT JOIN cna_event ce on sample_cna_event.CNA_EVENT_ID = ce.CNA_EVENT_ID
LEFT JOIN gene on ce.ENTREZ_GENE_ID = gene.ENTREZ_GENE_ID
LEFT JOIN genetic_profile gp on sample_cna_event.GENETIC_PROFILE_ID = gp.GENETIC_PROFILE_ID
LEFT JOIN sample_profile sp on gp.GENETIC_PROFILE_ID = sp.GENETIC_PROFILE_ID
LEFT JOIN cancer_study cs on gp.CANCER_STUDY_ID = cs.CANCER_STUDY_ID
LEFT JOIN sample on sample_cna_event.SAMPLE_ID = sample.INTERNAL_ID
LEFT JOIN gene_panel ON sp.PANEL_ID = gene_panel.INTERNAL_ID;
-- sample_clinical_attribute_numeric
CREATE VIEW view_sample_clinical_attribute_numeric AS
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', s.STABLE_ID) as sample_unique_id,
concat(cs.CANCER_STUDY_IDENTIFIER, '_', p.STABLE_ID) as patient_unique_id,
ATTR_ID as attribute_name,
ATTR_VALUE as attribute_value,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier
FROM cancer_study cs
INNER JOIN patient p on cs.CANCER_STUDY_ID = p.CANCER_STUDY_ID
INNER JOIN sample s on p.INTERNAL_ID = s.PATIENT_ID
INNER JOIN clinical_sample cs on s.INTERNAL_ID = cs.INTERNAL_ID
WHERE ATTR_VALUE REGEXP '^[0-9.]+$';
-- sample_clinical_attribute_categorical
CREATE VIEW view_sample_clinical_attribute_categorical AS
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', s.STABLE_ID) as sample_unique_id,
concat(cs.CANCER_STUDY_IDENTIFIER, '_', p.STABLE_ID) as patient_unique_id,
ATTR_ID as attribute_name,
ATTR_VALUE as attribute_value,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier
FROM cancer_study cs
INNER JOIN patient p on cs.CANCER_STUDY_ID = p.CANCER_STUDY_ID
INNER JOIN sample s on p.INTERNAL_ID = s.PATIENT_ID
INNER JOIN clinical_sample cs on s.INTERNAL_ID = cs.INTERNAL_ID
WHERE ATTR_VALUE NOT REGEXP '^[0-9.]+$';
-- patient_clinical_attribute_numeric
CREATE VIEW view_patient_clinical_attribute_numeric AS
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', p.STABLE_ID) as patient_unique_id,
ATTR_ID as attribute_name,
ATTR_VALUE as attribute_value,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier
FROM cancer_study cs
INNER JOIN patient p on cs.CANCER_STUDY_ID = p.CANCER_STUDY_ID
INNER JOIN clinical_patient cp on p.INTERNAL_ID = cp.INTERNAL_ID
WHERE ATTR_VALUE REGEXP '^[0-9.]+$';
-- patient_clinical_attribute_categorical
CREATE VIEW view_patient_clinical_attribute_categorical AS
SELECT
concat(cs.CANCER_STUDY_IDENTIFIER, '_', p.STABLE_ID) as patient_unique_id,
ATTR_ID as attribute_name,
ATTR_VALUE as attribute_value,
cs.CANCER_STUDY_IDENTIFIER as cancer_study_identifier
FROM cancer_study cs
INNER JOIN patient p on cs.CANCER_STUDY_ID = p.CANCER_STUDY_ID
INNER JOIN clinical_patient cp on p.INTERNAL_ID = cp.INTERNAL_ID
WHERE ATTR_VALUE NOT REGEXP '^[0-9.]+$';