Skip to content

Commit 8047c9d

Browse files
authored
Merge pull request #1425 from nragusa/updated-sql-counts
Updated row validation counts for MIMIC-IV
2 parents b3da107 + 40f4dd6 commit 8047c9d

File tree

2 files changed

+50
-50
lines changed

2 files changed

+50
-50
lines changed

mimic-iv/buildmimic/mysql/validate.sql

Lines changed: 25 additions & 26 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,5 @@
1-
-- Validate the MIMIC-IV tables built correctly by checking against known row counts.
2-
-- This script checks using the number of rows in the MIMIC-IV demo, a 100 patient subset
3-
-- of MIMIC-IV.
1+
-- Validate the MIMIC-IV tables built correctly by checking against known row counts
2+
-- of MIMIC-IV v2.1
4 | 3
SELECT
5 | 4
CASE
6 | 5
WHEN exp.row_count = obs.row_count
@@ -12,35 +11,35 @@ SELECT
12 | 11
, exp.tbl
13 | 12
-- expected row count - hard-coded based off known values
14 | 13
FROM (
15-
SELECT 'admissions' AS tbl, 454324 AS row_count UNION ALL
14+
SELECT 'admissions' AS tbl, 431088 AS row_count UNION ALL
16 | 15
SELECT 'd_hcpcs' AS tbl, 89200 AS row_count UNION ALL
17 | 16
SELECT 'd_icd_diagnoses' AS tbl, 109775 AS row_count UNION ALL
18 | 17
SELECT 'd_icd_procedures' AS tbl, 85257 AS row_count UNION ALL
19 | 18
SELECT 'd_labitems' AS tbl, 1623 AS row_count UNION ALL
20-
SELECT 'diagnoses_icd' AS tbl, 5006884 AS row_count UNION ALL
21-
SELECT 'drgcodes' AS tbl, 636157 AS row_count UNION ALL
22-
SELECT 'emar' AS tbl, 28189413 AS row_count UNION ALL
23-
SELECT 'emar_detail' AS tbl, 57469291 AS row_count UNION ALL
24-
SELECT 'hcpcsevents' AS tbl, 159156 AS row_count UNION ALL
25-
SELECT 'labevents' AS tbl, 124342638 AS row_count UNION ALL
26-
SELECT 'microbiologyevents' AS tbl, 3395229 AS row_count UNION ALL
27-
SELECT 'omr' AS tbl, 6770301 AS row_count UNION ALL
28-
SELECT 'patients' AS tbl, 315460 AS row_count UNION ALL
29-
SELECT 'pharmacy' AS tbl, 14291703 AS row_count UNION ALL
30-
SELECT 'poe' AS tbl, 41427803 AS row_count UNION ALL
31-
SELECT 'poe_detail' AS tbl, 3174971 AS row_count UNION ALL
32-
SELECT 'prescriptions' AS tbl, 16219412 AS row_count UNION ALL
33-
SELECT 'procedures_icd' AS tbl, 704124 AS row_count UNION ALL
34-
SELECT 'services' AS tbl, 492967 AS row_count UNION ALL
35-
SELECT 'transfers' AS tbl, 1991704 AS row_count UNION ALL
19+
SELECT 'diagnoses_icd' AS tbl, 4752265 AS row_count UNION ALL
20+
SELECT 'drgcodes' AS tbl, 603645 AS row_count UNION ALL
21+
SELECT 'emar' AS tbl, 26743071 AS row_count UNION ALL
22+
SELECT 'emar_detail' AS tbl, 54514587 AS row_count UNION ALL
23+
SELECT 'hcpcsevents' AS tbl, 150943 AS row_count UNION ALL
24+
SELECT 'labevents' AS tbl, 118057948 AS row_count UNION ALL
25+
SELECT 'microbiologyevents' AS tbl, 3223345 AS row_count UNION ALL
26+
SELECT 'omr' AS tbl, 6422067 AS row_count UNION ALL
27+
SELECT 'patients' AS tbl, 299777 AS row_count UNION ALL
28+
SELECT 'pharmacy' AS tbl, 13568015 AS row_count UNION ALL
29+
SELECT 'poe' AS tbl, 39340661 AS row_count UNION ALL
30+
SELECT 'poe_detail' AS tbl, 3013854 AS row_count UNION ALL
31+
SELECT 'prescriptions' AS tbl, 15399811 AS row_count UNION ALL
32+
SELECT 'procedures_icd' AS tbl, 668993 AS row_count UNION ALL
33+
SELECT 'services' AS tbl, 467851 AS row_count UNION ALL
34+
SELECT 'transfers' AS tbl, 1890730 AS row_count UNION ALL
36 | 35
-- icu data
37-
SELECT 'icustays' AS tbl, 76943 AS row_count UNION ALL
36+
SELECT 'icustays' AS tbl, 73141 AS row_count UNION ALL
38 | 37
SELECT 'd_items' AS tbl, 4014 AS row_count UNION ALL
39-
SELECT 'chartevents' AS tbl, 329822285 AS row_count UNION ALL
40-
SELECT 'datetimeevents' AS tbl, 7477876 AS row_count UNION ALL
41-
SELECT 'inputevents' AS tbl, 9442345 AS row_count UNION ALL
42-
SELECT 'outputevents' AS tbl, 4450049 AS row_count UNION ALL
43-
SELECT 'procedureevents' AS tbl, 731788 AS row_count
38+
SELECT 'chartevents' AS tbl, 314035266 AS row_count UNION ALL
39+
SELECT 'datetimeevents' AS tbl, 7117467 AS row_count UNION ALL
40+
SELECT 'inputevents' AS tbl, 8989135 AS row_count UNION ALL
41+
SELECT 'outputevents' AS tbl, 4234697 AS row_count UNION ALL
42+
SELECT 'procedureevents' AS tbl, 696191 AS row_count
44 | 43
) exp
45 | 44
-- observed row count
46 | 45
INNER JOIN

mimic-iv/buildmimic/postgres/validate.sql

Lines changed: 25 additions & 24 deletions
Original file line number | Diff line number | Diff line change
@@ -1,35 +1,36 @@
1-
-- Validate the MIMIC-IV tables built correctly by checking against known row counts.
1+
-- Validate the MIMIC-IV tables built correctly by checking against known row counts
2+
-- of MIMIC-IV v2.1
2 | 3
WITH expected AS
3 | 4
(
4-
SELECT 'admissions' AS tbl, 454324 AS row_count UNION ALL
5+
SELECT 'admissions' AS tbl, 431088 AS row_count UNION ALL
5 | 6
SELECT 'd_hcpcs' AS tbl, 89200 AS row_count UNION ALL
6 | 7
SELECT 'd_icd_diagnoses' AS tbl, 109775 AS row_count UNION ALL
7 | 8
SELECT 'd_icd_procedures' AS tbl, 85257 AS row_count UNION ALL
8 | 9
SELECT 'd_labitems' AS tbl, 1623 AS row_count UNION ALL
9-
SELECT 'diagnoses_icd' AS tbl, 5006884 AS row_count UNION ALL
10-
SELECT 'drgcodes' AS tbl, 636157 AS row_count UNION ALL
11-
SELECT 'emar' AS tbl, 28189413 AS row_count UNION ALL
12-
SELECT 'emar_detail' AS tbl, 57469291 AS row_count UNION ALL
13-
SELECT 'hcpcsevents' AS tbl, 159156 AS row_count UNION ALL
14-
SELECT 'labevents' AS tbl, 124342638 AS row_count UNION ALL
15-
SELECT 'microbiologyevents' AS tbl, 3395229 AS row_count UNION ALL
16-
SELECT 'omr' AS tbl, 6770301 AS row_count UNION ALL
17-
SELECT 'patients' AS tbl, 315460 AS row_count UNION ALL
18-
SELECT 'pharmacy' AS tbl, 14291703 AS row_count UNION ALL
19-
SELECT 'poe' AS tbl, 41427803 AS row_count UNION ALL
20-
SELECT 'poe_detail' AS tbl, 3174971 AS row_count UNION ALL
21-
SELECT 'prescriptions' AS tbl, 16219412 AS row_count UNION ALL
22-
SELECT 'procedures_icd' AS tbl, 704124 AS row_count UNION ALL
23-
SELECT 'services' AS tbl, 492967 AS row_count UNION ALL
24-
SELECT 'transfers' AS tbl, 1991704 AS row_count UNION ALL
10+
SELECT 'diagnoses_icd' AS tbl, 4752265 AS row_count UNION ALL
11+
SELECT 'drgcodes' AS tbl, 603645 AS row_count UNION ALL
12+
SELECT 'emar' AS tbl, 26743071 AS row_count UNION ALL
13+
SELECT 'emar_detail' AS tbl, 54514587 AS row_count UNION ALL
14+
SELECT 'hcpcsevents' AS tbl, 150943 AS row_count UNION ALL
15+
SELECT 'labevents' AS tbl, 118057948 AS row_count UNION ALL
16+
SELECT 'microbiologyevents' AS tbl, 3223345 AS row_count UNION ALL
17+
SELECT 'omr' AS tbl, 6422067 AS row_count UNION ALL
18+
SELECT 'patients' AS tbl, 299777 AS row_count UNION ALL
19+
SELECT 'pharmacy' AS tbl, 13568015 AS row_count UNION ALL
20+
SELECT 'poe' AS tbl, 39340661 AS row_count UNION ALL
21+
SELECT 'poe_detail' AS tbl, 3013854 AS row_count UNION ALL
22+
SELECT 'prescriptions' AS tbl, 15399811 AS row_count UNION ALL
23+
SELECT 'procedures_icd' AS tbl, 668993 AS row_count UNION ALL
24+
SELECT 'services' AS tbl, 467851 AS row_count UNION ALL
25+
SELECT 'transfers' AS tbl, 1890730 AS row_count UNION ALL
25 | 26
-- icu data
26-
SELECT 'icustays' AS tbl, 76943 AS row_count UNION ALL
27+
SELECT 'icustays' AS tbl, 73141 AS row_count UNION ALL
27 | 28
SELECT 'd_items' AS tbl, 4014 AS row_count UNION ALL
28-
SELECT 'chartevents' AS tbl, 329822285 AS row_count UNION ALL
29-
SELECT 'datetimeevents' AS tbl, 7477876 AS row_count UNION ALL
30-
SELECT 'inputevents' AS tbl, 9442345 AS row_count UNION ALL
31-
SELECT 'outputevents' AS tbl, 4450049 AS row_count UNION ALL
32-
SELECT 'procedureevents' AS tbl, 731788 AS row_count
29+
SELECT 'chartevents' AS tbl, 314035266 AS row_count UNION ALL
30+
SELECT 'datetimeevents' AS tbl, 7117467 AS row_count UNION ALL
31+
SELECT 'inputevents' AS tbl, 8989135 AS row_count UNION ALL
32+
SELECT 'outputevents' AS tbl, 4234697 AS row_count UNION ALL
33+
SELECT 'procedureevents' AS tbl, 696191 AS row_count
33 | 34
)
34 | 35
, observed as
35 | 36
(

0 commit comments

Comments
 (0)