File size: 347 Bytes
d51135f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
from datasets import load_dataset

def load_discharge_notes():
    """Load the note events and keep only the discharge summaries.

    Loads the ``train`` split of the ``NOTEEVENTS`` configuration of
    ``ntphuc149/MIMIC-III-Clinical-Database`` through ``load_dataset`` and
    keeps the rows whose ``CATEGORY`` value is exactly
    ``"Discharge summary"`` (case-sensitive comparison).

    Returns:
        The filtered dataset object returned by ``filter``.
    """
    notes = load_dataset(
        "ntphuc149/MIMIC-III-Clinical-Database",
        "NOTEEVENTS",
        split="train",
    )

    # Hand only the CATEGORY column to the predicate: the other columns are
    # not needed for the comparison, so there is no reason to build a full
    # row dict for every example.
    return notes.filter(
        lambda category: category == "Discharge summary",
        input_columns=["CATEGORY"],
    )