-
Notifications
You must be signed in to change notification settings - Fork 1.5k
/
Copy pathmake_concepts.sh
59 lines (52 loc) · 2.32 KB
/
make_concepts.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
#!/bin/bash
# This script generates the concepts in the BigQuery table mimiciv_derived.
export TARGET_DATASET=mimiciv_derived
# specify bigquery query command options
# note: max_rows=1 *displays* only one row, but all rows are inserted into the destination table
BQ_OPTIONS='--quiet --headless --max_rows=0 --use_legacy_sql=False --replace'
# generate a few tables first as the desired order isn't alphabetical
for table_path in demographics/icustay_times;
do
table=`echo $table_path | rev | cut -d/ -f1 | rev`
echo "Generating ${TARGET_DATASET}.${table}"
bq query ${BQ_OPTIONS} --destination_table=${TARGET_DATASET}.${table} < ${table_path}.sql
done
# generate tables in subfolders
# order is important for a few tables here:
# * firstday should go last
# * sepsis depends on score (sofa.sql in particular)
# * organfailure depends on measurement
for d in demographics comorbidity measurement medication organfailure treatment firstday score sepsis;
do
for fn in `ls $d`;
do
# only run SQL queries
if [[ "${fn: -4}" == ".sql" ]]; then
# table name is file name minus extension
tbl=`echo $fn | rev | cut -d. -f2- | rev`
# skip certain tables where order matters
skip=0
for skip_table in meld icustay_times first_day_sofa kdigo_stages vasoactive_agent norepinephrine_eqivalent_dose
do
if [[ "${tbl}" == "${skip_table}" ]]; then
skip=1
break
fi
done;
if [[ "${skip}" == "1" ]]; then
continue
fi
# not skipping - so generate the table on bigquery
echo "Generating ${TARGET_DATASET}.${tbl}"
bq query ${BQ_OPTIONS} --destination_table=${TARGET_DATASET}.${tbl} < ${d}/${fn}
fi
done
done
echo "Now generating tables which were skipped due to depending on other tables."
# generate tables after the above, and in a specific order to ensure dependencies are met
for table_path in firstday/first_day_sofa organfailure/kdigo_stages organfailure/meld medication/vasoactive_agent medication/norepinephrine_equivalent_dose;
do
table=`echo $table_path | rev | cut -d/ -f1 | rev`
echo "Generating ${TARGET_DATASET}.${table}"
bq query ${BQ_OPTIONS} --destination_table=${TARGET_DATASET}.${table} < ${table_path}.sql
done