diff --git a/src/MEDS_DEV/datasets/eICU/README.md b/src/MEDS_DEV/datasets/eICU/README.md new file mode 100644 index 0000000..170d601 --- /dev/null +++ b/src/MEDS_DEV/datasets/eICU/README.md @@ -0,0 +1,33 @@ +# eICU Collaborative Research Database + +## Description + +The eICU Collaborative Research Database is a multi-center database comprising de-identified health data associated with over 200,000 admissions to ICUs across the United States between 2014-2015. The database includes vital sign measurements, care plan documentation, severity of illness measures, diagnosis information, and treatment information. Data is collected through the Philips eICU program, a critical care telehealth program that delivers information to caregivers at the bedside.[1] + +## Access Requirements + +Taken from [PhysioNet](https://physionet.org/content/eicu-crd/2.0/): + +- **Access Policy**: Complete the credentialed data access requirements on PhysioNet[2] +- **License (for files)**: PhysioNet Credentialed Health Data License Version 1.5.0[2] +- **Data Use Agreement**: Agreement requires verified institutional affiliation and commitment to use data solely for lawful scientific research[2] +- **Required training**: Valid CITI training certification in human research subject protection and HIPAA regulations[2] +- **License Term**: 3 years from account creation date[2] +- **Code Sharing**: Agreement to contribute code associated with publications to open research repository[2] + +## Supported Tasks + +- `tasks/mortality/in_icu/first_24h.yaml` + +## MEDS-transformation + +eICU is available in three formats: Original (compatible with benchmark repository), MEDS (Medical Event Data Standard), and OMOP (full OMOP table dumps). The MEDS version contains the same exact data as the Original dataset but in MEDS-compatible format.[1] + +## Sources + +1. [eICU Physionet Repository](https://physionet.org/content/eicu-crd/2.0/) +2. [PhysioNet Credentialed Access](https://physionet.org/content/eicu-crd/view-license/2.0/) + +## Disclaimer + +Please refer to the data owners and the most up-to-date information when using this dataset in your research. The eICU dataset has not been reviewed or approved by the Food and Drug Administration and is for non-clinical, research and education use only.[2] diff --git a/src/MEDS_DEV/datasets/eICU/dataset.yaml b/src/MEDS_DEV/datasets/eICU/dataset.yaml new file mode 100644 index 0000000..89a86da --- /dev/null +++ b/src/MEDS_DEV/datasets/eICU/dataset.yaml @@ -0,0 +1,23 @@ +metadata: + description: >- + A MEDS version of eICU. + links: + - https://github.com/Medical-Event-Data-Standard/eICU_MEDS + - https://physionet.org/content/eicu-crd/ + contacts: + - name: "Robin P. van de Water" + github_username: "rvandewater" +commands: + build_full: >- + MEDS_extract-eICU + raw_input_dir="{temp_dir}/raw" + pre_MEDS_dir="{temp_dir}/pre_MEDS" + MEDS_cohort_dir="{output_dir}" + log_dir="{output_dir}/.pipeline_logs" + build_demo: >- + MEDS_extract-eICU + do_demo=True + raw_input_dir="{temp_dir}/raw" + pre_MEDS_dir="{temp_dir}/pre_MEDS" + MEDS_cohort_dir="{output_dir}" + log_dir="{output_dir}/.pipeline_logs" diff --git a/src/MEDS_DEV/datasets/eICU/predicates.yaml b/src/MEDS_DEV/datasets/eICU/predicates.yaml new file mode 100644 index 0000000..ca69557 --- /dev/null +++ b/src/MEDS_DEV/datasets/eICU/predicates.yaml @@ -0,0 +1,162 @@ +predicates: + hospital_admission: + code: { regex: "^HOSPITAL_ADMISSION//.*" } + hospital_discharge: + code: { regex: "^HOSPITAL_DISCHARGE//.*" } + + ED_registration: + code: { regex: "^ED_REGISTRATION//.*" } + ED_discharge: + code: { regex: "^ED_OUT//.*" } + + icu_admission: + code: { regex: "^ICU_ADMISSION//.*" } + icu_discharge: + code: { regex: "^ICU_DISCHARGE//.*" } + + creatinine_1: + code: LAB//50912//mg/dL + creatinine_2: + code: LAB//52546//mg/dL + abnormally_high_creatinine_1: + code: LAB//50912//mg/dL + value_min: 1.3 # mg/dL + value_min_inclusive: False + value_max: null + abnormally_high_creatinine_2: + code: LAB//52546//mg/dL + value_min: 1.3 # mg/dL + value_min_inclusive: False + value_max: null + creatinine: + expr: or(creatinine_1, creatinine_2) + abnormally_high_creatinine: + expr: or(abnormally_high_creatinine_1, abnormally_high_creatinine_2) + + sodium_1: + code: LAB//220645//mEq/L + sodium_2: + code: LAB//50983//mEq/L + sodium_3: + code: LAB//52623//mEq/L + abnormally_low_sodium_1: + code: LAB//220645//mEq/L + value_min: null + value_max: 135 # mEq/L + value_max_inclusive: False + abnormally_low_sodium_2: + code: LAB//50983//mEq/L + value_min: null + value_max: 135 # mEq/L + value_max_inclusive: False + abnormally_low_sodium_3: + code: LAB//52623//mEq/L + value_min: null + value_max: 135 # mEq/L + value_max_inclusive: False + sodium: + expr: or(sodium_1, sodium_2, sodium_3) + abnormally_low_sodium: + expr: or(abnormally_low_sodium_1, abnormally_low_sodium_2, abnormally_low_sodium_3) + + bicarbonate_1: + code: LAB//227443//mEq/L + bicarbonate_2: + code: LAB//50882//mEq/L + abnormally_low_bicarbonate_1: + code: LAB//227443//mEq/L + value_min: null + value_max: 22 # mEq/L + value_max_inclusive: False + abnormally_low_bicarbonate_2: + code: LAB//50882//mEq/L + value_min: null + value_max: 22 # mEq/L + value_max_inclusive: False + bicarbonate: + expr: or(bicarbonate_1, bicarbonate_2) + abnormally_low_bicarbonate: + expr: or(abnormally_low_bicarbonate_1, abnormally_low_bicarbonate_2) + + hemoglobin_1: + code: LAB//220228//g/dl + hemoglobin_2: + code: LAB//50811//g/dL + abnormally_low_hemoglobin_1: + code: LAB//220228//g/dl + value_min: null + value_max: 13 # g/dL + value_max_inclusive: False + abnormally_low_hemoglobin_2: + code: LAB//50811//g/dL + value_min: null + value_max: 13 # g/dL + value_max_inclusive: False + hemoglobin: + expr: or(hemoglobin_1, hemoglobin_2) + abnormally_low_hemoglobin: + expr: or(abnormally_low_hemoglobin_1, abnormally_low_hemoglobin_2) + + wbc_1: + code: LAB//220546//K/uL + wbc_2: + code: LAB//51300//K/uL + abnormally_high_wbc_1: + code: LAB//220546//K/uL + value_min: 11 # K/uL + value_min_inclusive: False + value_max: null + abnormally_high_wbc_2: + code: LAB//51300//K/uL + value_min: 11 # K/uL + value_min_inclusive: False + value_max: null + wbc: + expr: or(wbc_1, wbc_2) + abnormally_high_wbc: + expr: or(abnormally_high_wbc_1, abnormally_high_wbc_2) + + platelets_1: + code: LAB//227457//K/uL + platelets_2: + code: LAB//51265//K/uL + abnormally_low_platelets_1: + code: LAB//227457//K/uL + value_min: null + value_max: 150 # K/uL + value_max_inclusive: False + abnormally_low_platelets_2: + code: LAB//51265//K/uL + value_min: null + value_max: 150 # K/uL + value_max_inclusive: False + platelets: + expr: or(platelets_1, platelets_2) + abnormally_low_platelets: + expr: or(abnormally_low_platelets_1, abnormally_low_platelets_2) + + map_1: + code: LAB//220052//mmHg + map_2: + code: LAB//220181//mmHg + map_3: + code: LAB//225312//mmHg + abnormally_low_map_1: + code: LAB//220052//mmHg + value_min: null + value_max: 65 # mmHg + value_max_inclusive: False + abnormally_low_map_2: + code: LAB//220181//mmHg + value_min: null + value_max: 65 # mmHg + value_max_inclusive: False + abnormally_low_map_3: + code: LAB//225312//mmHg + value_min: null + value_max: 65 # mmHg + value_max_inclusive: False + map: + expr: or(map_1, map_2, map_3) + abnormally_low_map: + expr: or(abnormally_low_map_1, abnormally_low_map_2, abnormally_low_map_3) diff --git a/src/MEDS_DEV/datasets/eICU/refs.bib b/src/MEDS_DEV/datasets/eICU/refs.bib new file mode 100644 index 0000000..d28eabd --- /dev/null +++ b/src/MEDS_DEV/datasets/eICU/refs.bib @@ -0,0 +1,15 @@ +@article{pollardEICUCollaborativeResearch2018, + title = {The {{eICU Collaborative Research Database}}, a Freely Available Multi-Center Database for Critical Care Research}, + author = {Pollard, Tom J. and Johnson, Alistair E. W. and Raffa, Jesse D. and Celi, Leo A. and Mark, Roger G. and Badawi, Omar}, + year = 2018, + month = dec, + journal = {Scientific Data}, + volume = {5}, + number = {1}, + pages = {180178}, + issn = {2052-4463}, + doi = {10.1038/sdata.2018.178}, + urldate = {2022-03-09}, + langid = {english}, + keywords = {_tablet}, +} diff --git a/src/MEDS_DEV/datasets/eICU/requirements.txt b/src/MEDS_DEV/datasets/eICU/requirements.txt new file mode 100644 index 0000000..602edaf --- /dev/null +++ b/src/MEDS_DEV/datasets/eICU/requirements.txt @@ -0,0 +1 @@ +eICU-MEDS==0.0.2