forked from MIT-LCP/mimic-code
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathelixhauser_quan.sql
270 lines (234 loc) · 9.77 KB
/
elixhauser_quan.sql
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
-- This code calculates the Elixhauser comorbidities as defined in Quan et. al 2009:
-- Quan, Hude, et al. "Coding algorithms for defining comorbidities in
-- ICD-9-CM and ICD-10 administrative data." Medical care (2005): 1130-1139.
-- https://www.ncbi.nlm.nih.gov/pubmed/16224307
-- Quan defined an "Enhanced ICD-9" coding scheme for deriving Elixhauser
-- comorbidities from ICD-9 billing codes. This script implements that calculation.
-- The logic of the code is roughly that, if the comorbidity lists a length 3
-- ICD-9 code (e.g. 585), then we only require a match on the first 3 characters.
-- This code derives each comorbidity as follows:
-- 1) ICD9_CODE is directly compared to 5 character codes
-- 2) The first 4 characters of ICD9_CODE are compared to 4 character codes
-- 3) The first 3 characters of ICD9_CODE are compared to 3 character codes
with eliflg as
(
select hadm_id, seq_num, icd9_code
, CASE
when icd9_code in ('39891','40201','40211','40291','40401','40403','40411','40413','40491','40493') then 1
when SUBSTR(icd9_code, 1, 4) in ('4254','4255','4257','4258','4259') then 1
when SUBSTR(icd9_code, 1, 3) in ('428') then 1
else 0 end as chf /* Congestive heart failure */
, CASE
when icd9_code in ('42613','42610','42612','99601','99604') then 1
when SUBSTR(icd9_code, 1, 4) in ('4260','4267','4269','4270','4271','4272','4273','4274','4276','4278','4279','7850','V450','V533') then 1
else 0 end as arrhy
, CASE
when SUBSTR(icd9_code, 1, 4) in ('0932','7463','7464','7465','7466','V422','V433') then 1
when SUBSTR(icd9_code, 1, 3) in ('394','395','396','397','424') then 1
else 0 end as valve /* Valvular disease */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('4150','4151','4170','4178','4179') then 1
when SUBSTR(icd9_code, 1, 3) in ('416') then 1
else 0 end as pulmcirc /* Pulmonary circulation disorder */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('0930','4373','4431','4432','4438','4439','4471','5571','5579','V434') then 1
when SUBSTR(icd9_code, 1, 3) in ('440','441') then 1
else 0 end as perivasc /* Peripheral vascular disorder */
, CASE
when SUBSTR(icd9_code, 1, 3) in ('401') then 1
else 0 end as htn /* Hypertension, uncomplicated */
, CASE
when SUBSTR(icd9_code, 1, 3) in ('402','403','404','405') then 1
else 0 end as htncx /* Hypertension, complicated */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('3341','3440','3441','3442','3443','3444','3445','3446','3449') then 1
when SUBSTR(icd9_code, 1, 3) in ('342','343') then 1
else 0 end as para /* Paralysis */
, CASE
when icd9_code in ('33392') then 1
when SUBSTR(icd9_code, 1, 4) in ('3319','3320','3321','3334','3335','3362','3481','3483','7803','7843') then 1
when SUBSTR(icd9_code, 1, 3) in ('334','335','340','341','345') then 1
else 0 end as neuro /* Other neurological */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('4168','4169','5064','5081','5088') then 1
when SUBSTR(icd9_code, 1, 3) in ('490','491','492','493','494','495','496','500','501','502','503','504','505') then 1
else 0 end as chrnlung /* Chronic pulmonary disease */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('2500','2501','2502','2503') then 1
else 0 end as dm /* Diabetes w/o chronic complications*/
, CASE
when SUBSTR(icd9_code, 1, 4) in ('2504','2505','2506','2507','2508','2509') then 1
else 0 end as dmcx /* Diabetes w/ chronic complications */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('2409','2461','2468') then 1
when SUBSTR(icd9_code, 1, 3) in ('243','244') then 1
else 0 end as hypothy /* Hypothyroidism */
, CASE
when icd9_code in ('40301','40311','40391','40402','40403','40412','40413','40492','40493') then 1
when SUBSTR(icd9_code, 1, 4) in ('5880','V420','V451') then 1
when SUBSTR(icd9_code, 1, 3) in ('585','586','V56') then 1
else 0 end as renlfail /* Renal failure */
, CASE
when icd9_code in ('07022','07023','07032','07033','07044','07054') then 1
when SUBSTR(icd9_code, 1, 4) in ('0706','0709','4560','4561','4562','5722','5723','5724','5728','5733','5734','5738','5739','V427') then 1
when SUBSTR(icd9_code, 1, 3) in ('570','571') then 1
else 0 end as liver /* Liver disease */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('5317','5319','5327','5329','5337','5339','5347','5349') then 1
else 0 end as ulcer /* Chronic Peptic ulcer disease (includes bleeding only if obstruction is also present) */
, CASE
when SUBSTR(icd9_code, 1, 3) in ('042','043','044') then 1
else 0 end as aids /* HIV and AIDS */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('2030','2386') then 1
when SUBSTR(icd9_code, 1, 3) in ('200','201','202') then 1
else 0 end as lymph /* Lymphoma */
, CASE
when SUBSTR(icd9_code, 1, 3) in ('196','197','198','199') then 1
else 0 end as mets /* Metastatic cancer */
, CASE
when SUBSTR(icd9_code, 1, 3) in
(
'140','141','142','143','144','145','146','147','148','149','150','151','152'
,'153','154','155','156','157','158','159','160','161','162','163','164','165'
,'166','167','168','169','170','171','172','174','175','176','177','178','179'
,'180','181','182','183','184','185','186','187','188','189','190','191','192'
,'193','194','195'
) then 1
else 0 end as tumor /* Solid tumor without metastasis */
, CASE
when icd9_code in ('72889','72930') then 1
when SUBSTR(icd9_code, 1, 4) in ('7010','7100','7101','7102','7103','7104','7108','7109','7112','7193','7285') then 1
when SUBSTR(icd9_code, 1, 3) in ('446','714','720','725') then 1
else 0 end as arth /* Rheumatoid arthritis/collagen vascular diseases */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('2871','2873','2874','2875') then 1
when SUBSTR(icd9_code, 1, 3) in ('286') then 1
else 0 end as coag /* Coagulation deficiency */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('2780') then 1
else 0 end as obese /* Obesity */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('7832','7994') then 1
when SUBSTR(icd9_code, 1, 3) in ('260','261','262','263') then 1
else 0 end as wghtloss /* Weight loss */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('2536') then 1
when SUBSTR(icd9_code, 1, 3) in ('276') then 1
else 0 end as lytes /* Fluid and electrolyte disorders */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('2800') then 1
else 0 end as bldloss /* Blood loss anemia */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('2801','2808','2809') then 1
when SUBSTR(icd9_code, 1, 3) in ('281') then 1
else 0 end as anemdef /* Deficiency anemias */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('2652','2911','2912','2913','2915','2918','2919','3030','3039','3050','3575','4255','5353','5710','5711','5712','5713','V113') then 1
when SUBSTR(icd9_code, 1, 3) in ('980') then 1
else 0 end as alcohol /* Alcohol abuse */
, CASE
when icd9_code in ('V6542') then 1
when SUBSTR(icd9_code, 1, 4) in ('3052','3053','3054','3055','3056','3057','3058','3059') then 1
when SUBSTR(icd9_code, 1, 3) in ('292','304') then 1
else 0 end as drug /* Drug abuse */
, CASE
when icd9_code in ('29604','29614','29644','29654') then 1
when SUBSTR(icd9_code, 1, 4) in ('2938') then 1
when SUBSTR(icd9_code, 1, 3) in ('295','297','298') then 1
else 0 end as psych /* Psychoses */
, CASE
when SUBSTR(icd9_code, 1, 4) in ('2962','2963','2965','3004') then 1
when SUBSTR(icd9_code, 1, 3) in ('309','311') then 1
else 0 end as depress /* Depression */
from `physionet-data.mimiciii_clinical.diagnoses_icd` icd
where seq_num != 1 -- we do not include the primary icd-9 code
)
-- collapse the icd9_code specific flags into hadm_id specific flags
-- this groups comorbidities together for a single patient admission
, eligrp as
(
select hadm_id
, max(chf) as chf
, max(arrhy) as arrhy
, max(valve) as valve
, max(pulmcirc) as pulmcirc
, max(perivasc) as perivasc
, max(htn) as htn
, max(htncx) as htncx
, max(para) as para
, max(neuro) as neuro
, max(chrnlung) as chrnlung
, max(dm) as dm
, max(dmcx) as dmcx
, max(hypothy) as hypothy
, max(renlfail) as renlfail
, max(liver) as liver
, max(ulcer) as ulcer
, max(aids) as aids
, max(lymph) as lymph
, max(mets) as mets
, max(tumor) as tumor
, max(arth) as arth
, max(coag) as coag
, max(obese) as obese
, max(wghtloss) as wghtloss
, max(lytes) as lytes
, max(bldloss) as bldloss
, max(anemdef) as anemdef
, max(alcohol) as alcohol
, max(drug) as drug
, max(psych) as psych
, max(depress) as depress
from eliflg
group by hadm_id
)
-- now merge these flags together to define elixhauser
-- most are straightforward.. but hypertension flags are a bit more complicated
select adm.hadm_id
, chf as congestive_heart_failure
, arrhy as cardiac_arrhythmias
, valve as valvular_disease
, pulmcirc as pulmonary_circulation
, perivasc as peripheral_vascular
-- we combine "htn" and "htncx" into "HYPERTENSION"
, case
when htn = 1 then 1
when htncx = 1 then 1
else 0 end as hypertension
, para as paralysis
, neuro as other_neurological
, chrnlung as chronic_pulmonary
-- only the more severe comorbidity (complicated diabetes) is kept
, case
when dmcx = 1 then 0
when dm = 1 then 1
else 0 end as diabetes_uncomplicated
, dmcx as diabetes_complicated
, hypothy as hypothyroidism
, renlfail as renal_failure
, liver as liver_disease
, ulcer as peptic_ulcer
, aids as aids
, lymph as lymphoma
, mets as metastatic_cancer
-- only the more severe comorbidity (metastatic cancer) is kept
, case
when mets = 1 then 0
when tumor = 1 then 1
else 0 end as solid_tumor
, arth as rheumatoid_arthritis
, coag as coagulopathy
, obese as obesity
, wghtloss as weight_loss
, lytes as fluid_electrolyte
, bldloss as blood_loss_anemia
, anemdef as deficiency_anemias
, alcohol as alcohol_abuse
, drug as drug_abuse
, psych as psychoses
, depress as depression
FROM `physionet-data.mimiciii_clinical.admissions` adm
left join eligrp eli
on adm.hadm_id = eli.hadm_id
order by adm.hadm_id;