16
16
17
17
class MIMICBHCScenario (Scenario ):
18
18
"""
19
- MIMIC-IV-BHC presents a curated collection of preprocessed clinical discharge notes with labeled brief hospital course (BHC) summaries.
20
- This dataset is derived from MIMIC-IV (https://doi.org/10.1093/jamia/ocae312).
21
-
19
+ MIMIC-IV-BHC presents a curated collection of preprocessed clinical discharge notes with labeled brief
20
+ hospital course (BHC) summaries. This dataset is derived from MIMIC-IV (https://doi.org/10.1093/jamia/ocae312).
21
+
22
22
In total, the dataset contains 270,033 clinical notes.
23
23
The splits are provided by the dataset itself.
24
24
@@ -47,7 +47,7 @@ class MIMICBHCScenario(Scenario):
47
47
year={2024},
48
48
publisher={Oxford University Press}
49
49
}
50
-
50
+
51
51
@article{aali2024mimic,
52
52
title={MIMIC-IV-Ext-BHC: Labeled Clinical Notes Dataset for Hospital Course Summarization},
53
53
author={Aali, Asad and Van Veen, Dave and Arefeen, YI and Hom, Jason and Bluethgen, Christian
@@ -81,8 +81,8 @@ def get_instances(self, output_path: str) -> List[Instance]:
81
81
with open (file , "r" ) as f :
82
82
data = [json .loads (line ) for line in f ]
83
83
os .remove (file )
84
-
85
- for data_split , split in splits .items ():
84
+
85
+ for data_split , split in splits .items ():
86
86
clinical_notes : List [str ] = [x ["input" ] for x in data ]
87
87
bhc_summaries : List [str ] = [x ["target" ] for x in data ]
88
88
assert len (clinical_notes ) == len (bhc_summaries ), "Notes and summaries must have the same length"
@@ -97,4 +97,4 @@ def get_instances(self, output_path: str) -> List[Instance]:
97
97
)
98
98
)
99
99
100
- return instances
100
+ return instances
0 commit comments