hssling committed on
Commit
26841c9
·
1 Parent(s): 066afed

Switch to edcci/GenECG public image dataset to avoid MIMIC-IV protected paths

Browse files
Files changed (1) hide show
  1. train_ecg.py +4 -3
train_ecg.py CHANGED
@@ -7,7 +7,7 @@ from huggingface_hub import login
7
 
8
  # 1. Configuration targeting ECG Image Scans
9
  MODEL_ID = "Qwen/Qwen2-VL-2B-Instruct"
10
- DATASET_ID = "PULSE-ECG/ECGInstruct"
11
  OUTPUT_DIR = "./cardioai-adapter"
12
  HF_HUB_REPO = "hssling/cardioai-adapter"
13
 
@@ -46,7 +46,8 @@ def main():
46
 
47
  print(f"Loading dataset: {DATASET_ID}")
48
  try:
49
- dataset = load_dataset(DATASET_ID, split="train[:10000]") # Using 10k real ECG items
 
50
  except Exception as e:
51
  print(f"Warning: {DATASET_ID} not found. Synthesizing a robust mock dataset for algorithmic testing.")
52
  from datasets import Dataset
@@ -58,7 +59,7 @@ def main():
58
  dataset = Dataset.from_dict({"image": dummy_images, "findings": dummy_findings})
59
 
60
  def format_data(example):
61
- findings = example.get("findings") or example.get("output") or example.get("text") or example.get("description") or "ECG tracing findings."
62
  messages = [
63
  {
64
  "role": "system",
 
7
 
8
  # 1. Configuration targeting ECG Image Scans
9
  MODEL_ID = "Qwen/Qwen2-VL-2B-Instruct"
10
+ DATASET_ID = "edcci/GenECG"
11
  OUTPUT_DIR = "./cardioai-adapter"
12
  HF_HUB_REPO = "hssling/cardioai-adapter"
13
 
 
46
 
47
  print(f"Loading dataset: {DATASET_ID}")
48
  try:
49
+ # edcci/GenECG contains real generated image matrices of PTB-XL
50
+ dataset = load_dataset(DATASET_ID, "A", split="train[:2000]")
51
  except Exception as e:
52
  print(f"Warning: {DATASET_ID} not found. Synthesizing a robust mock dataset for algorithmic testing.")
53
  from datasets import Dataset
 
59
  dataset = Dataset.from_dict({"image": dummy_images, "findings": dummy_findings})
60
 
61
  def format_data(example):
62
+ findings = "Standard clinical 12-lead ECG tracing. Real signal derived from PTB-XL."
63
  messages = [
64
  {
65
  "role": "system",