{
  "cells": [
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "p-fvcK3rZHoK",
        "outputId": "452c5e35-056d-4bdb-d921-a634d510638b"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Mounted at /content/drive\n"
          ]
        }
      ],
      "source": [
        "from google.colab import drive\n",
        "drive.mount('/content/drive',force_remount=True)\n",
        "\n",
        "root = \"/content/drive/MyDrive/SPRSound/SPRSound-main\"\n",
        "# Set device\n",
        "train_mode=True\n",
        "test_mode=False\n",
        "split_data=False"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "nhv5GGqEZtqY",
        "outputId": "a6b22e3c-f3c3-480a-d07d-836a8b30fc0d"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Cloning into 'hear'...\n",
            "remote: Enumerating objects: 216, done.\u001b[K\n",
            "remote: Counting objects: 100% (87/87), done.\u001b[K\n",
            "remote: Compressing objects: 100% (40/40), done.\u001b[K\n",
            "remote: Total 216 (delta 72), reused 47 (delta 47), pack-reused 129 (from 1)\u001b[K\n",
            "Receiving objects: 100% (216/216), 62.06 MiB | 19.19 MiB/s, done.\n",
            "Resolving deltas: 100% (128/128), done.\n"
          ]
        }
      ],
      "source": [
        "import os\n",
        "if not os.path.exists('/content/hear'):\n",
        "  !git clone https://github.com/Google-Health/hear"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "iX_h8XZMZNhg"
      },
      "outputs": [],
      "source": [
        "import torch\n",
        "import torch.nn as nn\n",
        "import torch.nn.functional as F\n",
        "from torch.utils.data import Dataset,DataLoader,WeightedRandomSampler\n",
        "from transformers import AutoModel\n",
        "import math\n",
        "import os\n",
        "import sys\n",
        "import json\n",
        "import pandas as pd\n",
        "import numpy as np\n",
        "from tqdm import tqdm\n",
        "from pathlib import Path\n",
        "import torchaudio\n",
        "import importlib\n",
        "from typing import Optional, Dict, List\n",
        "from collections import Counter\n",
        "from sklearn.model_selection import train_test_split\n",
        "from sklearn.metrics import (\n",
        "    accuracy_score,\n",
        "    f1_score,\n",
        "    precision_score,\n",
        "    recall_score,\n",
        "    confusion_matrix,\n",
        "    classification_report,\n",
        "    roc_auc_score\n",
        ")\n",
        "from sklearn.preprocessing import label_binarize\n",
        "import matplotlib.pyplot as plt\n",
        "import seaborn as sns\n",
        "from torch.nn.utils.rnn import pack_padded_sequence\n",
        "import regex as re\n",
        "import random"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "q4H9-8vsoZwF"
      },
      "outputs": [],
      "source": [
        "###### train test split - one time run ######\n",
        "\n",
        "def collect_all_samples(root_dir: str, consolidate_labels: bool = True) -> pd.DataFrame:\n",
        "    \"\"\"\n",
        "    Collect all samples from all BioCAS years (2022-2025) into a single DataFrame.\n",
        "\n",
        "    Args:\n",
        "        root_dir: Path to SPRSound dataset root\n",
        "        consolidate_labels: Whether to consolidate rare labels into main classes\n",
        "\n",
        "    Returns:\n",
        "        DataFrame with columns: wav_path, json_path, filename, year, original_split, event_types, label, original_label\n",
        "    \"\"\"\n",
        "    root_dir = Path(root_dir)\n",
        "    all_samples = []\n",
        "\n",
        "    # Define all available datasets\n",
        "    datasets = [\n",
        "        ('2022', 'train', None),\n",
        "        ('2022', 'test', 'inter'),\n",
        "        ('2022', 'test', 'intra'),\n",
        "        ('2023', 'test', None),\n",
        "        ('2024', 'test', None),\n",
        "        ('2025', 'test', None),\n",
        "    ]\n",
        "\n",
        "    print(\"=\"*80)\n",
        "    print(\"COLLECTING ALL SAMPLES FROM ALL YEARS\")\n",
        "    print(\"=\"*80)\n",
        "\n",
        "    for year, split, test_type in datasets:\n",
        "        year_dir = root_dir / f\"BioCAS{year}\"\n",
        "\n",
        "        # Set paths\n",
        "        if split == 'train':\n",
        "            wav_dir = year_dir / f\"train{year}_wav\"\n",
        "            json_dir = year_dir / f\"train{year}_json\"\n",
        "            split_name = f\"{year}_train\"\n",
        "        else:  # test\n",
        "            wav_dir = year_dir / f\"test{year}_wav\"\n",
        "\n",
        "            if year == '2022' and test_type:\n",
        "                if test_type == 'inter':\n",
        "                    json_dir = year_dir / f\"test{year}_json\" / \"inter_test_json\"\n",
        "                    split_name = f\"{year}_test_inter\"\n",
        "                else:  # intra\n",
        "                    json_dir = year_dir / f\"test{year}_json\" / \"intra_test_json\"\n",
        "                    split_name = f\"{year}_test_intra\"\n",
        "            else:\n",
        "                json_dir = year_dir / f\"test{year}_json\"\n",
        "                split_name = f\"{year}_test\"\n",
        "\n",
        "        # Check if directories exist\n",
        "        if not wav_dir.exists() or not json_dir.exists():\n",
        "            print(f\"Skipping {split_name}: directories not found\")\n",
        "            continue\n",
        "\n",
        "        # Load all JSON files\n",
        "        json_files = sorted(json_dir.glob(\"*.json\"))\n",
        "        print(f\"\\nProcessing {split_name}: {len(json_files)} files\")\n",
        "\n",
        "        for json_path in json_files:\n",
        "            with open(json_path, 'r') as f:\n",
        "                annotation = json.load(f)\n",
        "\n",
        "            # Get corresponding WAV filename\n",
        "            wav_filename = json_path.stem + '.wav'\n",
        "            wav_path = wav_dir / wav_filename\n",
        "\n",
        "            if not wav_path.exists():\n",
        "                print(f\"Warning: WAV file not found: {wav_path}\")\n",
        "                continue\n",
        "\n",
        "            # Extract event types\n",
        "            events = annotation.get('event_annotation', [])\n",
        "            event_types = [event.get('type', '') for event in events]\n",
        "\n",
        "            # Parse original label (detailed)\n",
        "            original_label = _parse_label_detailed(event_types)\n",
        "\n",
        "            # Parse consolidated label\n",
        "            if consolidate_labels:\n",
        "                label = _consolidate_label(original_label)\n",
        "            else:\n",
        "                label = original_label\n",
        "\n",
        "            sample = {\n",
        "                'wav_path': str(wav_path),\n",
        "                'json_path': str(json_path),\n",
        "                'filename': wav_filename,\n",
        "                'year': year,\n",
        "                'original_split': split_name,\n",
        "                'event_types': '|'.join(event_types),  # Store as pipe-separated string\n",
        "                'original_label': original_label,\n",
        "                'label': label\n",
        "            }\n",
        "\n",
        "            all_samples.append(sample)\n",
        "\n",
        "        print(f\"  Collected {len(json_files)} samples from {split_name}\")\n",
        "\n",
        "    # Create DataFrame\n",
        "    df = pd.DataFrame(all_samples)\n",
        "\n",
        "    print(f\"\\n{'='*80}\")\n",
        "    print(f\"TOTAL SAMPLES COLLECTED: {len(df)}\")\n",
        "    print(f\"{'='*80}\")\n",
        "\n",
        "    # Print statistics\n",
        "    print(\"\\nSamples per year:\")\n",
        "    print(df['year'].value_counts().sort_index())\n",
        "\n",
        "    print(\"\\nSamples per original split:\")\n",
        "    print(df['original_split'].value_counts())\n",
        "\n",
        "    if consolidate_labels:\n",
        "        print(\"\\nOriginal label distribution (before consolidation):\")\n",
        "        print(df['original_label'].value_counts())\n",
        "\n",
        "        print(\"\\nConsolidated label distribution:\")\n",
        "        print(df['label'].value_counts())\n",
        "\n",
        "        # Show mapping\n",
        "        print(\"\\nLabel consolidation mapping:\")\n",
        "        mapping = df.groupby('original_label')['label'].first().to_dict()\n",
        "        for orig, consol in sorted(mapping.items()):\n",
        "            if orig != consol:\n",
        "                count = (df['original_label'] == orig).sum()\n",
        "                print(f\"  {orig} -> {consol} ({count} samples)\")\n",
        "    else:\n",
        "        print(\"\\nLabel distribution:\")\n",
        "        print(df['label'].value_counts())\n",
        "\n",
        "    return df\n",
        "\n",
        "\n",
        "def _parse_label_detailed(event_types: List[str]) -> str:\n",
        "    \"\"\"Parse detailed label from event types (preserves all combinations)\"\"\"\n",
        "    if not event_types:\n",
        "        return 'normal'\n",
        "\n",
        "    # Get unique event types\n",
        "    unique_events = list(set(event_types))\n",
        "\n",
        "    # Remove 'Normal' from the list\n",
        "    non_normal_events = [e for e in unique_events if e.lower() != 'normal']\n",
        "\n",
        "    # If no abnormal events, label as normal\n",
        "    if not non_normal_events:\n",
        "        return 'normal'\n",
        "\n",
        "    # Sort and join non-normal events\n",
        "    sorted_events = sorted([e.lower() for e in non_normal_events])\n",
        "\n",
        "    return '+'.join(sorted_events)\n",
        "\n",
        "\n",
        "def _consolidate_label(original_label: str) -> str:\n",
        "\n",
        "    label_lower = original_label.lower()\n",
        "\n",
        "    # Normal case\n",
        "    if label_lower == 'normal':\n",
        "        return 'normal'\n",
        "    return \"abnormal\"\n",
        "\n",
        "def extract_patient_id(filename: str) -> str:\n",
        "    \"\"\"\n",
        "    Extract patient ID from filename.\n",
        "\n",
        "    Filename pattern: PATIENTID_X.X_X_pX_XXXX.wav\n",
        "    Example: 41055397_3.0_0_p3_10805.wav -> patient_id = 41055397\n",
        "\n",
        "    Args:\n",
        "        filename: Audio filename\n",
        "\n",
        "    Returns:\n",
        "        Patient ID string, or None if pattern doesn't match\n",
        "    \"\"\"\n",
        "    match = re.match(r'(\\d+)_', filename)\n",
        "    if match:\n",
        "        return match.group(1)\n",
        "    return None\n",
        "\n",
        "\n",
        "def create_patient_level_splits(\n",
        "    df: pd.DataFrame,\n",
        "    train_ratio: float = 0.7,\n",
        "    val_ratio: float = 0.15,\n",
        "    test_ratio: float = 0.15,\n",
        "    random_state: int = 42,\n",
        "    min_samples_per_class: int = 10\n",
        ") -> tuple[pd.DataFrame, pd.DataFrame, pd.DataFrame]:\n",
        "    \"\"\"\n",
        "    Create patient-level stratified splits to prevent data leakage.\n",
        "\n",
        "    CRITICAL: This ensures NO patient appears in multiple splits.\n",
        "    Each patient's recordings all go into the same split (train/val/test).\n",
        "\n",
        "    Args:\n",
        "        df: DataFrame with all samples\n",
        "        train_ratio: Proportion for training (default: 0.7)\n",
        "        val_ratio: Proportion for validation (default: 0.15)\n",
        "        test_ratio: Proportion for test (default: 0.15)\n",
        "        random_state: Random seed for reproducibility\n",
        "        min_samples_per_class: Minimum samples for stratification\n",
        "\n",
        "    Returns:\n",
        "        train_df, val_df, test_df with NO patient overlap\n",
        "    \"\"\"\n",
        "    assert abs(train_ratio + val_ratio + test_ratio - 1.0) < 1e-6, \"Ratios must sum to 1.0\"\n",
        "\n",
        "    print(f\"\\n{'='*80}\")\n",
        "    print(\"CREATING PATIENT-LEVEL STRATIFIED SPLITS (NO LEAKAGE)\")\n",
        "    print(f\"{'='*80}\")\n",
        "    print(f\"Train ratio: {train_ratio:.2f}\")\n",
        "    print(f\"Val ratio: {val_ratio:.2f}\")\n",
        "    print(f\"Test ratio: {test_ratio:.2f}\")\n",
        "    print(f\"Random state: {random_state}\")\n",
        "\n",
        "    # Extract patient IDs\n",
        "    df = df.copy()\n",
        "    df['patient_id'] = df['filename'].apply(extract_patient_id)\n",
        "\n",
        "    # Remove samples without patient ID\n",
        "    samples_without_id = df['patient_id'].isna().sum()\n",
        "    if samples_without_id > 0:\n",
        "        print(f\"\\n⚠️  Warning: {samples_without_id} samples without patient ID will be excluded\")\n",
        "        df = df[df['patient_id'].notna()].copy()\n",
        "\n",
        "    print(f\"\\nDataset statistics:\")\n",
        "    print(f\"  Total samples: {len(df)}\")\n",
        "    print(f\"  Unique patients: {df['patient_id'].nunique()}\")\n",
        "\n",
        "    # Group by patient and determine each patient's characteristics\n",
        "    patient_data = []\n",
        "\n",
        "    for patient_id in df['patient_id'].unique():\n",
        "        patient_samples = df[df['patient_id'] == patient_id]\n",
        "\n",
        "        # Get the majority label for this patient (for stratification)\n",
        "        label_counts = patient_samples['label'].value_counts()\n",
        "        majority_label = label_counts.index[0]\n",
        "\n",
        "        # Also track if patient has multiple labels\n",
        "        has_multiple_labels = len(patient_samples['label'].unique()) > 1\n",
        "\n",
        "        patient_data.append({\n",
        "            'patient_id': patient_id,\n",
        "            'majority_label': majority_label,\n",
        "            'num_samples': len(patient_samples),\n",
        "            'unique_labels': patient_samples['label'].nunique(),\n",
        "            'all_labels': list(patient_samples['label'].unique())\n",
        "        })\n",
        "\n",
        "    patient_df = pd.DataFrame(patient_data)\n",
        "\n",
        "    print(f\"\\nPatient-level statistics:\")\n",
        "    print(f\"  Total patients: {len(patient_df)}\")\n",
        "    print(f\"  Patients with multiple labels: {(patient_df['unique_labels'] > 1).sum()}\")\n",
        "    print(f\"  Average samples per patient: {patient_df['num_samples'].mean():.2f}\")\n",
        "    print(f\"  Median samples per patient: {patient_df['num_samples'].median():.0f}\")\n",
        "\n",
        "    print(f\"\\nMajority label distribution across patients:\")\n",
        "    print(patient_df['majority_label'].value_counts())\n",
        "\n",
        "    # Handle rare classes by grouping for stratification\n",
        "    label_counts = patient_df['majority_label'].value_counts()\n",
        "    rare_labels = label_counts[label_counts < min_samples_per_class].index.tolist()\n",
        "\n",
        "    def group_labels_for_stratification(label):\n",
        "        \"\"\"Group rare labels for better stratification\"\"\"\n",
        "        if label in rare_labels:\n",
        "            return 'rare'\n",
        "        return label\n",
        "\n",
        "    patient_df['stratify_label'] = patient_df['majority_label'].apply(\n",
        "        group_labels_for_stratification\n",
        "    )\n",
        "\n",
        "    if rare_labels:\n",
        "        print(f\"\\n⚠️  Rare labels grouped for stratification:\")\n",
        "        for label in rare_labels:\n",
        "            count = (patient_df['majority_label'] == label).sum()\n",
        "            print(f\"  {label}: {count} patients\")\n",
        "\n",
        "    # PATIENT-LEVEL SPLIT (not sample-level!)\n",
        "    # Step 1: Split patients into train and temp (val+test)\n",
        "    train_patients, temp_patients = train_test_split(\n",
        "        patient_df['patient_id'].values,\n",
        "        test_size=(val_ratio + test_ratio),\n",
        "        random_state=random_state,\n",
        "        stratify=patient_df['stratify_label'].values\n",
        "    )\n",
        "\n",
        "    # Step 2: Split temp patients into val and test\n",
        "    temp_patient_df = patient_df[patient_df['patient_id'].isin(temp_patients)]\n",
        "\n",
        "    # Adjust val ratio for the temp split\n",
        "    val_ratio_adjusted = val_ratio / (val_ratio + test_ratio)\n",
        "\n",
        "    val_patients, test_patients = train_test_split(\n",
        "        temp_patients,\n",
        "        test_size=(1 - val_ratio_adjusted),\n",
        "        random_state=random_state,\n",
        "        stratify=temp_patient_df['stratify_label'].values\n",
        "    )\n",
        "\n",
        "    # Convert to sets for fast lookup\n",
        "    train_patient_set = set(train_patients)\n",
        "    val_patient_set = set(val_patients)\n",
        "    test_patient_set = set(test_patients)\n",
        "\n",
        "    # Assign samples to splits based on patient ID\n",
        "    def assign_split(patient_id):\n",
        "        if patient_id in train_patient_set:\n",
        "            return 'train'\n",
        "        elif patient_id in val_patient_set:\n",
        "            return 'val'\n",
        "        elif patient_id in test_patient_set:\n",
        "            return 'test'\n",
        "        else:\n",
        "            return 'unknown'\n",
        "\n",
        "    df['split'] = df['patient_id'].apply(assign_split)\n",
        "\n",
        "    # Create split DataFrames\n",
        "    train_df = df[df['split'] == 'train'].copy()\n",
        "    val_df = df[df['split'] == 'val'].copy()\n",
        "    test_df = df[df['split'] == 'test'].copy()\n",
        "\n",
        "    # CRITICAL VERIFICATION: Check for patient leakage\n",
        "    print(f\"\\n{'='*80}\")\n",
        "    print(\"LEAKAGE VERIFICATION\")\n",
        "    print(f\"{'='*80}\")\n",
        "\n",
        "    train_pts = set(train_df['patient_id'].unique())\n",
        "    val_pts = set(val_df['patient_id'].unique())\n",
        "    test_pts = set(test_df['patient_id'].unique())\n",
        "\n",
        "    overlap_train_val = train_pts & val_pts\n",
        "    overlap_train_test = train_pts & test_pts\n",
        "    overlap_val_test = val_pts & test_pts\n",
        "\n",
        "    print(f\"\\nPatient distribution:\")\n",
        "    print(f\"  Train: {len(train_pts)} patients ({len(train_pts)/len(patient_df)*100:.1f}%)\")\n",
        "    print(f\"  Val:   {len(val_pts)} patients ({len(val_pts)/len(patient_df)*100:.1f}%)\")\n",
        "    print(f\"  Test:  {len(test_pts)} patients ({len(test_pts)/len(patient_df)*100:.1f}%)\")\n",
        "\n",
        "    print(f\"\\nLeakage check:\")\n",
        "    if len(overlap_train_val) == 0:\n",
        "        print(f\"  ✓ Train-Val overlap: 0 patients (GOOD)\")\n",
        "    else:\n",
        "        print(f\"  ✗ Train-Val overlap: {len(overlap_train_val)} patients (DATA LEAKAGE!)\")\n",
        "\n",
        "    if len(overlap_train_test) == 0:\n",
        "        print(f\"  ✓ Train-Test overlap: 0 patients (GOOD)\")\n",
        "    else:\n",
        "        print(f\"  ✗ Train-Test overlap: {len(overlap_train_test)} patients (DATA LEAKAGE!)\")\n",
        "\n",
        "    if len(overlap_val_test) == 0:\n",
        "        print(f\"  ✓ Val-Test overlap: 0 patients (GOOD)\")\n",
        "    else:\n",
        "        print(f\"  ✗ Val-Test overlap: {len(overlap_val_test)} patients (DATA LEAKAGE!)\")\n",
        "\n",
        "    # Print split statistics\n",
        "    print(f\"\\n{'='*80}\")\n",
        "    print(\"SPLIT STATISTICS\")\n",
        "    print(f\"{'='*80}\")\n",
        "    print(f\"\\nSample distribution:\")\n",
        "    print(f\"  Train: {len(train_df)} samples ({len(train_df)/len(df)*100:.1f}%)\")\n",
        "    print(f\"  Val:   {len(val_df)} samples ({len(val_df)/len(df)*100:.1f}%)\")\n",
        "    print(f\"  Test:  {len(test_df)} samples ({len(test_df)/len(df)*100:.1f}%)\")\n",
        "\n",
        "    # Label distribution per split\n",
        "    print(f\"\\nLabel distribution per split:\")\n",
        "    print(\"-\" * 80)\n",
        "\n",
        "    all_labels = sorted(df['label'].unique())\n",
        "    split_stats = []\n",
        "\n",
        "    for label in all_labels:\n",
        "        train_count = (train_df['label'] == label).sum()\n",
        "        val_count = (val_df['label'] == label).sum()\n",
        "        test_count = (test_df['label'] == label).sum()\n",
        "        total_count = train_count + val_count + test_count\n",
        "\n",
        "        if total_count > 0:\n",
        "            split_stats.append({\n",
        "                'label': label,\n",
        "                'train': train_count,\n",
        "                'val': val_count,\n",
        "                'test': test_count,\n",
        "                'total': total_count\n",
        "            })\n",
        "\n",
        "    split_stats_df = pd.DataFrame(split_stats)\n",
        "    print(split_stats_df.to_string(index=False))\n",
        "\n",
        "    return train_df, val_df, test_df\n",
        "\n",
        "\n",
        "def save_splits_to_csv(\n",
        "    train_df: pd.DataFrame,\n",
        "    val_df: pd.DataFrame,\n",
        "    test_df: pd.DataFrame,\n",
        "    output_dir: str\n",
        "):\n",
        "    \"\"\"\n",
        "    Save train/val/test splits to CSV files.\n",
        "\n",
        "    Args:\n",
        "        train_df, val_df, test_df: DataFrames for each split\n",
        "        output_dir: Directory to save CSV files\n",
        "    \"\"\"\n",
        "    output_dir = Path(output_dir)\n",
        "    output_dir.mkdir(parents=True, exist_ok=True)\n",
        "\n",
        "    train_path = output_dir / 'train.csv'\n",
        "    val_path = output_dir / 'val.csv'\n",
        "    test_path = output_dir / 'test.csv'\n",
        "\n",
        "    train_df.to_csv(train_path, index=False)\n",
        "    val_df.to_csv(val_path, index=False)\n",
        "    test_df.to_csv(test_path, index=False)\n",
        "\n",
        "    print(f\"\\n{'='*80}\")\n",
        "    print(\"SAVED SPLITS TO CSV\")\n",
        "    print(f\"{'='*80}\")\n",
        "    print(f\"Train: {train_path} ({len(train_df)} samples)\")\n",
        "    print(f\"Val: {val_path} ({len(val_df)} samples)\")\n",
        "    print(f\"Test: {test_path} ({len(test_df)} samples)\")\n",
        "\n",
        "    # Also save combined file with split column\n",
        "    combined_df = pd.concat([train_df, val_df, test_df], ignore_index=True)\n",
        "    combined_path = output_dir / 'all_splits.csv'\n",
        "    combined_df.to_csv(combined_path, index=False)\n",
        "    print(f\"Combined: {combined_path} ({len(combined_df)} samples)\")\n",
        "\n",
        "    # Save metadata\n",
        "    metadata = {\n",
        "        'total_samples': len(combined_df),\n",
        "        'train_samples': len(train_df),\n",
        "        'val_samples': len(val_df),\n",
        "        'test_samples': len(test_df),\n",
        "        'train_patients': int(train_df['patient_id'].nunique()),\n",
        "        'val_patients': int(val_df['patient_id'].nunique()),\n",
        "        'test_patients': int(test_df['patient_id'].nunique()),\n",
        "        'num_classes': len(combined_df['label'].unique()),\n",
        "        'classes': sorted(combined_df['label'].unique()),\n",
        "        'class_distribution': combined_df['label'].value_counts().to_dict(),\n",
        "        'note': 'Patient-level split: NO patient appears in multiple splits'\n",
        "    }\n",
        "\n",
        "    metadata_path = output_dir / 'metadata.json'\n",
        "    with open(metadata_path, 'w') as f:\n",
        "        json.dump(metadata, f, indent=2)\n",
        "    print(f\"Metadata: {metadata_path}\")\n",
        "\n",
        "\n",
        "def create_and_save_splits(\n",
        "    root_dir: str,\n",
        "    output_dir: str,\n",
        "    train_ratio: float = 0.7,\n",
        "    val_ratio: float = 0.15,\n",
        "    test_ratio: float = 0.15,\n",
        "    random_state: int = 42,\n",
        "    consolidate_labels: bool = True,\n",
        "    min_samples_per_class: int = 10\n",
        "):\n",
        "    \"\"\"\n",
        "    Main function to collect all data and create patient-level splits.\n",
        "\n",
        "    IMPORTANT: This creates patient-level splits to prevent data leakage.\n",
        "    No patient will appear in multiple splits (train/val/test).\n",
        "\n",
        "    Args:\n",
        "        root_dir: Path to SPRSound dataset root\n",
        "        output_dir: Directory to save CSV splits\n",
        "        train_ratio: Proportion for training (default: 0.7)\n",
        "        val_ratio: Proportion for validation (default: 0.15)\n",
        "        test_ratio: Proportion for test (default: 0.15)\n",
        "        random_state: Random seed for reproducibility\n",
        "        consolidate_labels: Whether to consolidate rare labels\n",
        "        min_samples_per_class: Minimum samples for stratification\n",
        "    \"\"\"\n",
        "    # Collect all samples\n",
        "    all_df = collect_all_samples(root_dir, consolidate_labels=consolidate_labels)\n",
        "\n",
        "    # Create PATIENT-LEVEL stratified splits (FIXED!)\n",
        "    train_df, val_df, test_df = create_patient_level_splits(\n",
        "        all_df,\n",
        "        train_ratio=train_ratio,\n",
        "        val_ratio=val_ratio,\n",
        "        test_ratio=test_ratio,\n",
        "        random_state=random_state,\n",
        "        min_samples_per_class=min_samples_per_class\n",
        "    )\n",
        "\n",
        "    # Save to CSV\n",
        "    save_splits_to_csv(train_df, val_df, test_df, output_dir)\n",
        "\n",
        "    return train_df, val_df, test_df\n",
        "\n",
        "if __name__ == \"__main__\":\n",
        "  if split_data:\n",
        "    create_and_save_splits(root,root)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "9eYXVJ_blQDs"
      },
      "outputs": [],
      "source": [
        "\n",
        "# -----------------------\n",
        "# utils\n",
        "# -----------------------\n",
        "def _rand_uniform(a, b):\n",
        "    return a + (b - a) * random.random()\n",
        "\n",
        "\n",
        "def _rms(x: torch.Tensor):\n",
        "    return torch.sqrt(torch.mean(x * x) + 1e-8)\n",
        "\n",
        "\n",
        "# -----------------------\n",
        "# FAST room effect (no convolution)\n",
        "# -----------------------\n",
        "def _apply_fast_echo(wav: torch.Tensor, sr: int):\n",
        "    \"\"\"\n",
        "    Very cheap reverb-like effect using a few delayed taps.\n",
        "    O(N) time, no conv1d.\n",
        "    \"\"\"\n",
        "    y = wav.clone()\n",
        "    n = y.numel()\n",
        "\n",
        "    for _ in range(random.randint(2, 4)):\n",
        "        delay = int(_rand_uniform(0.01, 0.08) * sr)  # 10–80 ms\n",
        "        if delay <= 0 or delay >= n:\n",
        "            continue\n",
        "        gain = _rand_uniform(0.05, 0.25)\n",
        "        y[delay:] += gain * wav[:-delay]\n",
        "\n",
        "    # mild damping\n",
        "    y = 0.7 * y + 0.3 * torch.tanh(2.0 * y)\n",
        "    return y\n",
        "\n",
        "\n",
        "# -----------------------\n",
        "# FAST colored noise (no filters)\n",
        "# -----------------------\n",
        "def _colored_noise_fast(noise: torch.Tensor):\n",
        "    \"\"\"\n",
        "    Brown-ish noise via cumulative sum + optional high-pass differencing.\n",
        "    Pure tensor ops.\n",
        "    \"\"\"\n",
        "    n = torch.cumsum(noise, dim=0)\n",
        "    n = n / (n.std().clamp_min(1e-6))\n",
        "\n",
        "    if random.random() < 0.5:\n",
        "        n = torch.cat([n[:1], n[1:] - 0.98 * n[:-1]], dim=0)\n",
        "\n",
        "    return n\n",
        "\n",
        "\n",
        "def _add_noise_snr_fast(wav: torch.Tensor, snr_db_range=(3, 25)):\n",
        "    snr_db = _rand_uniform(*snr_db_range)\n",
        "    noise = torch.randn_like(wav)\n",
        "    noise = _colored_noise_fast(noise)\n",
        "\n",
        "    sig_rms = _rms(wav)\n",
        "    noise_rms = _rms(noise)\n",
        "    target_noise_rms = sig_rms / (10 ** (snr_db / 20))\n",
        "    noise = noise * (target_noise_rms / (noise_rms + 1e-8))\n",
        "\n",
        "    return wav + noise\n",
        "\n",
        "\n",
        "# -----------------------\n",
        "# FAST phone band-limiting EQ (2 biquads max)\n",
        "# -----------------------\n",
        "def _phone_bandlimit_fast(wav: torch.Tensor, sr: int):\n",
        "    hp = random.choice([120, 150, 200])\n",
        "    lp = random.choice([4000, 6000, 8000])\n",
        "\n",
        "    y = torchaudio.functional.highpass_biquad(wav, sr, hp)\n",
        "    y = torchaudio.functional.lowpass_biquad(y, sr, lp)\n",
        "    return y\n",
        "\n",
        "\n",
        "# -----------------------\n",
        "# AGC-like soft compression\n",
        "# -----------------------\n",
        "def _soft_agc(wav: torch.Tensor):\n",
        "    gain_db = _rand_uniform(-6, 12)\n",
        "    gain = 10 ** (gain_db / 20)\n",
        "    y = wav * gain\n",
        "\n",
        "    drive = _rand_uniform(1.5, 3.5)\n",
        "    y = torch.tanh(drive * y)\n",
        "\n",
        "    return y\n",
        "\n",
        "\n",
        "# -----------------------\n",
        "# Misc cheap ops\n",
        "# -----------------------\n",
        "def _random_gain(wav: torch.Tensor, db_range=(-18, 8)):\n",
        "    g = 10 ** (_rand_uniform(*db_range) / 20)\n",
        "    return wav * g\n",
        "\n",
        "\n",
        "def _random_time_shift(wav: torch.Tensor, sr: int, max_s=0.08):\n",
        "    max_shift = int(max_s * sr)\n",
        "    if max_shift <= 0:\n",
        "        return wav\n",
        "    shift = random.randint(-max_shift, max_shift)\n",
        "    return torch.roll(wav, shifts=shift)\n",
        "\n",
        "\n",
        "def _random_clipping(wav: torch.Tensor, p=0.15):\n",
        "    if random.random() > p:\n",
        "        return wav\n",
        "    clip = _rand_uniform(0.3, 0.9)\n",
        "    return torch.clamp(wav, -clip, clip)\n",
        "\n",
        "\n",
        "# -----------------------\n",
        "# MAIN AUGMENT CLASS\n",
        "# -----------------------\n",
        "class PhoneLikeAugment:\n",
        "    \"\"\"\n",
        "    Fast phone-mic simulation for stethoscope → phone domain shift.\n",
        "    Designed for DataLoader safety + speed.\n",
        "    \"\"\"\n",
        "\n",
        "    def __init__(self, sr=16000, p=0.5):\n",
        "        self.sr = sr\n",
        "        self.p = p\n",
        "\n",
        "    def __call__(self, wav: torch.Tensor):\n",
        "        if random.random() > self.p:\n",
        "            return wav\n",
        "\n",
        "        y = wav\n",
        "\n",
        "        # small timing jitter\n",
        "        if random.random() < 0.4:\n",
        "            y = _random_time_shift(y, self.sr)\n",
        "\n",
        "        # distance / level\n",
        "        y = _random_gain(y)\n",
        "\n",
        "        # phone band-limiting\n",
        "        if random.random() < 0.9:\n",
        "            y = _phone_bandlimit_fast(y, self.sr)\n",
        "\n",
        "        # cheap room effect\n",
        "        if random.random() < 0.15:\n",
        "            y = _apply_fast_echo(y, self.sr)\n",
        "\n",
        "        # noise\n",
        "        if random.random() < 0.8:\n",
        "            y = _add_noise_snr_fast(y)\n",
        "\n",
        "        # AGC\n",
        "        if random.random() < 0.7:\n",
        "            y = _soft_agc(y)\n",
        "\n",
        "        # rare clipping\n",
        "        y = _random_clipping(y)\n",
        "\n",
        "        # final normalization\n",
        "        peak = y.abs().max().clamp_min(1e-6)\n",
        "        y = y / peak * _rand_uniform(0.3, 1.0)\n",
        "\n",
        "        return y"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "7teh4Wk1Z75R"
      },
      "outputs": [],
      "source": [
        "##########################DataSet###########################\n",
        "class SPRSoundDataset(Dataset):\n",
        "    \"\"\"\n",
        "    Dataset class for SPRSound that loads from pre-split CSV files.\n",
        "\n",
        "    HeAR expects 16kHz audio in 2-second chunks (32,000 samples).\n",
        "    For recordings longer than 2s, we chunk into non-overlapping 2s windows,\n",
        "    run preprocess_audio on each chunk, and stack them so the model can\n",
        "    aggregate (mean-pool) the per-chunk embeddings.\n",
        "\n",
        "    For recordings shorter than 2s, preprocess_audio zero-pads internally.\n",
        "\n",
        "    Args:\n",
        "        csv_path: Path to CSV file (train.csv, val.csv, or test.csv)\n",
        "        target_sr: Target sample rate — MUST be 16000 to match HeAR\n",
        "        max_duration: Maximum audio duration in seconds to keep (default: 10)\n",
        "        apply_hear_preprocess: Whether to apply HEAR preprocessing (default: True)\n",
        "    \"\"\"\n",
        "\n",
        "    # HeAR's fixed contract: 2 seconds at 16 kHz\n",
        "    HEAR_SR = 16000\n",
        "    HEAR_CHUNK_SAMPLES = 32000  # 2s * 16kHz\n",
        "\n",
        "    def __init__(\n",
        "        self,\n",
        "        csv_path: str,\n",
        "        target_sr: int = 16000,\n",
        "        max_duration: float = 10.0,\n",
        "        apply_hear_preprocess: bool = True,\n",
        "        class_to_idx=None,\n",
        "        is_train=False\n",
        "    ):\n",
        "        self.csv_path = Path(csv_path)\n",
        "        self.target_sr = target_sr\n",
        "        self.max_duration = max_duration\n",
        "        self.max_samples = int(target_sr * max_duration)\n",
        "        self.apply_hear_preprocess = apply_hear_preprocess\n",
        "\n",
        "        self.augment = PhoneLikeAugment(sr=self.target_sr, p=0.5) if is_train else None\n",
        "        self._resamplers = {}\n",
        "\n",
        "        self.class_to_idx = dict(class_to_idx)\n",
        "        self.idx_to_class = {v: k for k, v in self.class_to_idx.items()}\n",
        "\n",
        "        assert self.target_sr == self.HEAR_SR, (\n",
        "            f\"target_sr must be {self.HEAR_SR} to match HeAR preprocessing. \"\n",
        "            f\"Got {self.target_sr}. Resampling from native SR to 16kHz is \"\n",
        "            f\"handled automatically in _load_audio().\"\n",
        "        )\n",
        "\n",
        "        # Import HEAR preprocessing if needed\n",
        "        if apply_hear_preprocess:\n",
        "            audio_utils = importlib.import_module(\n",
        "                \"hear.python.data_processing.audio_utils\"\n",
        "            )\n",
        "            self.preprocess_audio = audio_utils.preprocess_audio\n",
        "\n",
        "        # Load CSV\n",
        "        self.df = pd.read_csv(csv_path)\n",
        "        self.df[\"label\"] = self.df[\"label\"].apply(\n",
        "            lambda x: \"normal\" if x == \"normal\" else \"abnormal\"\n",
        "        )\n",
        "        \"\"\"\n",
        "        # Build class mapping from all unique labels\n",
        "        all_labels = sorted(self.df['label'].unique())\n",
        "        self.class_to_idx = {label: idx for idx, label in enumerate(all_labels)}\n",
        "        self.idx_to_class = {v: k for k, v in self.class_to_idx.items()}\n",
        "        \"\"\"\n",
        "        split_name = self.csv_path.stem\n",
        "        print(f\"Loaded {len(self.df)} samples from {csv_path}\")\n",
        "        print(f\"Split: {split_name}\")\n",
        "        print(f\"Target SR: {self.target_sr} Hz (HeAR native)\")\n",
        "        print(f\"Number of classes: {len(self.class_to_idx)}\")\n",
        "        self._print_statistics()\n",
        "\n",
        "    def _print_statistics(self):\n",
        "        \"\"\"Print dataset statistics\"\"\"\n",
        "        label_counts = self.df['label'].value_counts()\n",
        "\n",
        "        print(f\"\\nClass distribution:\")\n",
        "        for label in sorted(label_counts.index):\n",
        "            count = label_counts[label]\n",
        "            percentage = count / len(self.df) * 100\n",
        "            class_idx = self.class_to_idx.get(label, '?')\n",
        "            print(f\"  [{class_idx:2d}] {label:20s}: {count:5d} ({percentage:5.2f}%)\")\n",
        "\n",
        "    def _load_audio(self, audio_path: str):\n",
        "        \"\"\"\n",
        "        Load audio, convert to mono, resample to 16 kHz, and truncate\n",
        "        to max_duration. Does NOT pad to a fixed length — chunking\n",
        "        handles variable lengths.\n",
        "        \"\"\"\n",
        "        waveform, sr = torchaudio.load(audio_path)\n",
        "\n",
        "        # Convert to mono if stereo\n",
        "        if waveform.shape[0] > 1:\n",
        "            waveform = torch.mean(waveform, dim=0, keepdim=True)\n",
        "\n",
        "        # Resample to 16 kHz (from 8 kHz or whatever native SR)\n",
        "        if sr != self.target_sr:\n",
        "            if sr not in self._resamplers:\n",
        "                self._resamplers[sr] = torchaudio.transforms.Resample(sr, self.target_sr)\n",
        "            waveform = self._resamplers[sr](waveform)\n",
        "\n",
        "\n",
        "        # Remove channel dimension → [samples]\n",
        "        waveform = waveform.squeeze(0)\n",
        "\n",
        "        # Truncate to max_duration (but don't pad — chunking handles short clips)\n",
        "        if waveform.shape[0] > self.max_samples:\n",
        "            waveform = waveform[:self.max_samples]\n",
        "\n",
        "        return waveform\n",
        "\n",
        "    def _chunk_and_preprocess(self, waveform: torch.Tensor) -> torch.Tensor:\n",
        "        \"\"\"\n",
        "        Split waveform into non-overlapping 2-second chunks, run HeAR's\n",
        "        preprocess_audio on each, and stack the resulting spectrograms.\n",
        "\n",
        "        For audio shorter than 2s, preprocess_audio handles zero-padding.\n",
        "        The last chunk is zero-padded if it doesn't fill a full 2s window.\n",
        "\n",
        "        Returns:\n",
        "            Tensor of shape [num_chunks, 1, 192, 128]\n",
        "        \"\"\"\n",
        "        chunk_size = self.HEAR_CHUNK_SAMPLES\n",
        "        total_samples = waveform.shape[0]\n",
        "\n",
        "        # Calculate number of chunks (ceiling division — last chunk gets padded)\n",
        "        num_chunks = max(1, math.ceil(total_samples / chunk_size))\n",
        "\n",
        "        chunks = []\n",
        "        for i in range(num_chunks):\n",
        "            start = i * chunk_size\n",
        "            end = min(start + chunk_size, total_samples)\n",
        "            chunk = waveform[start:end]\n",
        "\n",
        "            # Zero-pad last chunk if needed (preprocess_audio also pads, but\n",
        "            # let's be explicit and give it exactly 32000 samples)\n",
        "            if chunk.shape[0] < chunk_size:\n",
        "\n",
        "                chunk = torch.nn.functional.pad(\n",
        "                    chunk, (0, chunk_size - chunk.shape[0])\n",
        "                )\n",
        "\n",
        "\n",
        "            chunks.append(chunk)\n",
        "\n",
        "        # Stack chunks into a batch: [num_chunks, 32000]\n",
        "\n",
        "        chunk_batch = torch.stack(chunks, dim=0)\n",
        "\n",
        "        # Run HeAR preprocessing on the whole batch at once\n",
        "        # preprocess_audio expects [batch, 32000] → returns [batch, 1, 192, 128]\n",
        "\n",
        "        spectrograms = self.preprocess_audio(chunk_batch)\n",
        "        spectrograms = spectrograms.clamp(max=3.0)\n",
        "\n",
        "        return spectrograms\n",
        "\n",
        "    def __len__(self):\n",
        "        return len(self.df)\n",
        "\n",
        "    def __getitem__(self, idx):\n",
        "        row = self.df.iloc[idx]\n",
        "\n",
        "        waveform = self._load_audio(row['wav_path'])\n",
        "\n",
        "        if self.augment is not None:\n",
        "            waveform = self.augment(waveform)\n",
        "\n",
        "        if self.apply_hear_preprocess:\n",
        "            # [T, 1, 192, 128]\n",
        "            chunk_spectrograms = self._chunk_and_preprocess(waveform)\n",
        "\n",
        "            features = chunk_spectrograms\n",
        "            length = chunk_spectrograms.shape[0]\n",
        "        else:\n",
        "\n",
        "            features = waveform.unsqueeze(0)  # [1, samples]\n",
        "            length = 1\n",
        "\n",
        "        label = self.class_to_idx[row['label']]\n",
        "        event_types = row['event_types'].split('|') if pd.notna(row['event_types']) and row['event_types'] else []\n",
        "\n",
        "        return {\n",
        "            'features': features,      # [T, 1, 192, 128]\n",
        "            'length': length,          # int\n",
        "            'label': label,\n",
        "            'filename': row['filename'],\n",
        "            'event_types': event_types,\n",
        "            'year': row['year'],\n",
        "            'original_split': row['original_split'],\n",
        "            'original_label': row.get('original_label', row['label'])\n",
        "        }\n",
        "\n",
        "\n",
        "    def get_class_weights(self, method='inverse'):\n",
        "        \"\"\"Calculate class weights for handling imbalanced data\"\"\"\n",
        "        import torch\n",
        "\n",
        "        label_counts = Counter(self.df['label'])\n",
        "\n",
        "        total = len(self.df)\n",
        "        num_classes = len(self.class_to_idx)\n",
        "\n",
        "        if method == 'inverse':\n",
        "            weights = {}\n",
        "            for label, count in label_counts.items():\n",
        "                weights[self.class_to_idx[label]] = total / (num_classes * count)\n",
        "\n",
        "        elif method == 'effective':\n",
        "            beta = 0.9999\n",
        "            weights = {}\n",
        "            for label, count in label_counts.items():\n",
        "                effective_num = 1.0 - (beta ** count)\n",
        "                weights[self.class_to_idx[label]] = (1.0 - beta) / effective_num\n",
        "\n",
        "        else:\n",
        "            raise ValueError(f\"Unknown method: {method}\")\n",
        "\n",
        "        # Convert to tensor\n",
        "        weight_tensor = torch.zeros(num_classes)\n",
        "        for idx, weight in weights.items():\n",
        "            weight_tensor[idx] = weight\n",
        "\n",
        "        return weight_tensor\n",
        "def collate_respiratory_batch(batch):\n",
        "    # batch[i]['features'] is [T, 1, 192, 128]\n",
        "    lengths = torch.tensor([item['length'] for item in batch], dtype=torch.long)\n",
        "    max_len = int(lengths.max().item())\n",
        "\n",
        "    # infer feature shape\n",
        "    _, C, H, W = batch[0]['features'].shape\n",
        "\n",
        "    padded = torch.zeros(len(batch), max_len, C, H, W, dtype=batch[0]['features'].dtype)\n",
        "    for i, item in enumerate(batch):\n",
        "        T = item['features'].shape[0]\n",
        "        padded[i, :T] = item['features']\n",
        "\n",
        "    labels = torch.tensor([item['label'] for item in batch], dtype=torch.long)\n",
        "    filenames = [item['filename'] for item in batch]\n",
        "    event_types = [item['event_types'] for item in batch]\n",
        "    years = [item['year'] for item in batch]\n",
        "    original_splits = [item['original_split'] for item in batch]\n",
        "    original_labels = [item['original_label'] for item in batch]\n",
        "\n",
        "    return {\n",
        "        'features': padded,        # [B, T_max, 1, 192, 128]\n",
        "        'lengths': lengths,        # [B]\n",
        "        'label': labels,\n",
        "        'filename': filenames,\n",
        "        'event_types': event_types,\n",
        "        'year': years,\n",
        "        'original_split': original_splits,\n",
        "        'original_label': original_labels\n",
        "    }\n",
        "def visualize_spectrograms_by_class(dataset, class_names, num_samples_per_class=2, save_path=None):\n",
        "    \"\"\"\n",
        "    Visualize spectrogram samples from each class.\n",
        "\n",
        "    Args:\n",
        "        dataset: The dataset object (SPRSoundDataset)\n",
        "        class_names: List of class names\n",
        "        num_samples_per_class: Number of samples to visualize per class (default: 2)\n",
        "        save_path: Optional path to save the visualization\n",
        "    \"\"\"\n",
        "    # Collect indices for each class\n",
        "    class_indices = {i: [] for i in range(len(class_names))}\n",
        "\n",
        "    print(\"Collecting samples from each class...\")\n",
        "    for idx in range(len(dataset)):\n",
        "        label = dataset.df.iloc[idx]['label']\n",
        "        label=dataset.class_to_idx[label]\n",
        "        if len(class_indices[label]) < num_samples_per_class:\n",
        "            class_indices[label].append(idx)\n",
        "\n",
        "        # Stop if we have enough samples for all classes\n",
        "        if all(len(indices) >= num_samples_per_class for indices in class_indices.values()):\n",
        "            break\n",
        "\n",
        "    # Check if we have enough samples for each class\n",
        "    for class_idx, indices in class_indices.items():\n",
        "        if len(indices) < num_samples_per_class:\n",
        "            print(f\"Warning: Only found {len(indices)} samples for class '{class_names[class_idx]}'\")\n",
        "\n",
        "    # Create the visualization\n",
        "    num_classes = len(class_names)\n",
        "    fig, axes = plt.subplots(num_classes, num_samples_per_class,\n",
        "                             figsize=(5*num_samples_per_class, 4*num_classes))\n",
        "\n",
        "    # Handle case where we only have 1 sample per class\n",
        "    if num_samples_per_class == 1:\n",
        "        axes = axes.reshape(-1, 1)\n",
        "\n",
        "    print(\"\\nGenerating spectrograms...\")\n",
        "    for class_idx in range(num_classes):\n",
        "        indices = class_indices[class_idx]\n",
        "\n",
        "        for sample_idx, data_idx in enumerate(indices[:num_samples_per_class]):\n",
        "            # Get the data sample\n",
        "            sample = dataset[data_idx]\n",
        "            spectrogram = sample['features']  # Shape: [time, freq] or [freq, time]\n",
        "            filename = sample['filename']\n",
        "\n",
        "            # Convert to numpy if tensor\n",
        "            if torch.is_tensor(spectrogram):\n",
        "                spec_np = spectrogram.cpu().numpy()\n",
        "            else:\n",
        "                spec_np = spectrogram\n",
        "            # Handle 4D tensor: [T, 1, 192, 128]\n",
        "            if len(spec_np.shape) == 4:\n",
        "                spec_np = spec_np[0, 0, :, :]  # Shape: [192, 128] (freq, time)\n",
        "            elif len(spec_np.shape) == 3:\n",
        "                spec_np = spec_np[0, :, :]  # Shape: [192, 128]\n",
        "            # Plot the spectrogram\n",
        "            ax = axes[class_idx, sample_idx]\n",
        "\n",
        "            # Transpose if needed for correct orientation (frequency on y-axis)\n",
        "            if spec_np.shape[0] > spec_np.shape[1]:\n",
        "                spec_np = spec_np.T\n",
        "\n",
        "            im = ax.imshow(spec_np, aspect='auto', origin='lower', cmap='viridis')\n",
        "\n",
        "            # Set title with class name and filename\n",
        "            if sample_idx == 0:\n",
        "                ax.set_ylabel(f\"{class_names[class_idx]}\\n({filename})\",\n",
        "                             fontsize=10, fontweight='bold')\n",
        "            else:\n",
        "                ax.set_ylabel(filename, fontsize=8)\n",
        "\n",
        "            ax.set_xlabel('Time')\n",
        "            if sample_idx == 0:\n",
        "                ax.set_ylabel(f\"{class_names[class_idx]}\\nFrequency\", fontsize=10)\n",
        "            else:\n",
        "                ax.set_ylabel('Frequency', fontsize=8)\n",
        "\n",
        "            ax.set_title(f\"Sample {sample_idx+1}\", fontsize=9)\n",
        "\n",
        "            # Add colorbar\n",
        "            plt.colorbar(im, ax=ax, fraction=0.046, pad=0.04)\n",
        "\n",
        "    plt.suptitle('Spectrogram Samples by Class', fontsize=14, fontweight='bold', y=0.995)\n",
        "    plt.tight_layout()\n",
        "\n",
        "    if save_path:\n",
        "        os.makedirs(os.path.dirname(save_path), exist_ok=True)\n",
        "        plt.savefig(save_path, dpi=150, bbox_inches='tight')\n",
        "        print(f\"\\nVisualization saved to: {save_path}\")\n",
        "\n",
        "    plt.show()\n",
        "\n",
        "    return fig\n",
        "\n",
        "def quick_visualize_spectrograms(trainer):\n",
        "    \"\"\"\n",
        "    Quick function to visualize spectrograms from the trainer object.\n",
        "\n",
        "    Args:\n",
        "        trainer: RespiratoryTrainer object (already initialized)\n",
        "    \"\"\"\n",
        "    import matplotlib.pyplot as plt\n",
        "    import os\n",
        "\n",
        "    print(\"\\n\" + \"=\"*80)\n",
        "    print(\"VISUALIZING SPECTROGRAMS\")\n",
        "    print(\"=\"*80)\n",
        "\n",
        "    # Create output directory\n",
        "    output_dir = os.path.join(trainer.configs[\"logdir\"], \"figures\")\n",
        "    os.makedirs(output_dir, exist_ok=True)\n",
        "\n",
        "    # Visualize training spectrograms\n",
        "    print(\"\\nVisualizing TRAINING set...\")\n",
        "    train_save_path = os.path.join(output_dir, \"spectrograms_train.png\")\n",
        "    visualize_spectrograms_by_class(\n",
        "        dataset=trainer.train_dataset,\n",
        "        class_names=trainer.class_names,\n",
        "        num_samples_per_class=2,\n",
        "        save_path=train_save_path\n",
        "    )\n",
        "\n",
        "    # Visualize validation spectrograms\n",
        "    print(\"\\nVisualizing VALIDATION set...\")\n",
        "    val_save_path = os.path.join(output_dir, \"spectrograms_val.png\")\n",
        "    visualize_spectrograms_by_class(\n",
        "        dataset=trainer.val_dataset,\n",
        "        class_names=trainer.class_names,\n",
        "        num_samples_per_class=2,\n",
        "        save_path=val_save_path\n",
        "    )\n",
        "\n",
        "    print(\"\\n\" + \"=\"*80)\n",
        "    print(\"VISUALIZATION COMPLETE!\")\n",
        "    print(\"=\"*80)\n",
        "    print(f\"Training spectrograms: {train_save_path}\")\n",
        "    print(f\"Validation spectrograms: {val_save_path}\")\n",
        "\n",
        "\n",
        "def create_dataloaders_from_csv(\n",
        "    csv_dir: str,\n",
        "    batch_size: int = 16,\n",
        "    num_workers: int = 2\n",
        "):\n",
        "    \"\"\"\n",
        "    Create dataloaders from CSV files.\n",
        "\n",
        "    Args:\n",
        "        csv_dir: Directory containing train.csv, val.csv, test.csv\n",
        "        batch_size: Batch size\n",
        "        num_workers: Number of data loading workers\n",
        "    \"\"\"\n",
        "\n",
        "    csv_dir = Path(csv_dir)\n",
        "\n",
        "    CANONICAL_CLASSES = [\"normal\", \"abnormal\"]\n",
        "    CLASS_TO_IDX = {c: i for i, c in enumerate(CANONICAL_CLASSES)}\n",
        "    IDX_TO_CLASS = {i: c for c, i in CLASS_TO_IDX.items()}\n",
        "\n",
        "\n",
        "    # Create datasets\n",
        "    train_dataset = SPRSoundDataset(\n",
        "        csv_path=csv_dir / 'train.csv',\n",
        "        target_sr=16000 ,\n",
        "        max_duration=10.0,\n",
        "        apply_hear_preprocess=True,\n",
        "        class_to_idx=CLASS_TO_IDX,\n",
        "        is_train=True\n",
        "    )\n",
        "\n",
        "    val_dataset = SPRSoundDataset(\n",
        "        csv_path=csv_dir / 'val.csv',\n",
        "        target_sr=16000 ,\n",
        "        max_duration=10.0,\n",
        "        apply_hear_preprocess=True,\n",
        "        class_to_idx=CLASS_TO_IDX\n",
        "    )\n",
        "\n",
        "    test_dataset = SPRSoundDataset(\n",
        "        csv_path=csv_dir / 'test.csv',\n",
        "        target_sr=16000 ,\n",
        "        max_duration=10.0,\n",
        "        apply_hear_preprocess=True,\n",
        "        class_to_idx=CLASS_TO_IDX\n",
        "    )\n",
        "    print(\"\\n=== CLASS MAP CHECK ===\")\n",
        "    print(\"Train:\", train_dataset.class_to_idx)\n",
        "    print(\"Val:  \", val_dataset.class_to_idx)\n",
        "    print(\"Test: \", test_dataset.class_to_idx)\n",
        "\n",
        "    # Strict equality checks\n",
        "    print(\"train == val ?\", train_dataset.class_to_idx == val_dataset.class_to_idx)\n",
        "    print(\"train == test?\", train_dataset.class_to_idx == test_dataset.class_to_idx)\n",
        "\n",
        "    class_weights = train_dataset.get_class_weights()\n",
        "    label_indices = [train_dataset.class_to_idx[label] for label in train_dataset.df['label']]\n",
        "    sample_weights = [class_weights[idx].item() for idx in label_indices]\n",
        "    sampler = WeightedRandomSampler(\n",
        "        weights=sample_weights,\n",
        "        num_samples=len(sample_weights),\n",
        "        replacement=True\n",
        "    )\n",
        "    # Create dataloaders\n",
        "    train_loader = DataLoader(\n",
        "        train_dataset,\n",
        "        batch_size=batch_size,\n",
        "        sampler=sampler,\n",
        "        num_workers=num_workers,\n",
        "        pin_memory=True,\n",
        "        persistent_workers=True if num_workers > 0 else False,\n",
        "        collate_fn=collate_respiratory_batch\n",
        "    )\n",
        "\n",
        "    val_loader = DataLoader(\n",
        "        val_dataset,\n",
        "        batch_size=batch_size,\n",
        "        shuffle=False,\n",
        "        num_workers=num_workers,\n",
        "        pin_memory=True,\n",
        "        persistent_workers=True if num_workers > 0 else False,\n",
        "        collate_fn=collate_respiratory_batch\n",
        "    )\n",
        "\n",
        "    test_loader = DataLoader(\n",
        "        test_dataset,\n",
        "        batch_size=batch_size,\n",
        "        shuffle=False,\n",
        "        num_workers=num_workers,\n",
        "        pin_memory=True,\n",
        "        persistent_workers=True if num_workers > 0 else False,\n",
        "        collate_fn=collate_respiratory_batch\n",
        "    )\n",
        "\n",
        "    print(f\"\\n{'='*80}\")\n",
        "    print(\"DATALOADERS CREATED\")\n",
        "    print(f\"{'='*80}\")\n",
        "    print(f\"Train batches: {len(train_loader)}\")\n",
        "    print(f\"Val batches: {len(val_loader)}\")\n",
        "    print(f\"Test batches: {len(test_loader)}\")\n",
        "\n",
        "    return train_loader, val_loader, test_loader, class_weights, train_dataset\n",
        "\n",
        "# train_loader, val_loader, test_loader, class_weights, train_dataset=create_dataloaders_from_csv(root)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "MTXCmo5vquAU"
      },
      "outputs": [],
      "source": [
        "####### Model #######\n",
        "class GatedAttentionPool(nn.Module):\n",
        "    def __init__(self, dim: int, attn_hidden: int = 128, dropout: float = 0.2):\n",
        "        super().__init__()\n",
        "        self.V = nn.Sequential(\n",
        "            nn.LayerNorm(dim),\n",
        "            nn.Dropout(dropout),\n",
        "            nn.Linear(dim, attn_hidden)\n",
        "        )\n",
        "        self.U = nn.Sequential(\n",
        "            nn.LayerNorm(dim),\n",
        "            nn.Dropout(dropout),\n",
        "            nn.Linear(dim, attn_hidden)\n",
        "        )\n",
        "        self.w = nn.Linear(attn_hidden, 1)\n",
        "\n",
        "    def forward(self, x, lengths):\n",
        "        # x: [B,T,D]\n",
        "        Vx = self.V(x)  # [B,T,H]\n",
        "        Ux = self.U(x)  # [B,T,H]\n",
        "        scores = self.w(Vx * Ux).squeeze(-1)  # [B,T]\n",
        "\n",
        "        # Create mask\n",
        "        idxs = torch.arange(x.size(1), device=x.device).unsqueeze(0)\n",
        "        mask = idxs >= lengths.unsqueeze(1)\n",
        "        scores = scores.masked_fill(mask, float(\"-inf\"))\n",
        "\n",
        "        # Attention weights\n",
        "        attn = torch.softmax(scores, dim=1)\n",
        "\n",
        "        # Weighted pooling\n",
        "        pooled = torch.sum(x * attn.unsqueeze(-1), dim=1)\n",
        "\n",
        "        return pooled, attn\n",
        "\n",
        "class LoRALinear(nn.Module):\n",
        "    \"\"\"\n",
        "    Wraps an existing nn.Linear layer with LoRA:\n",
        "      y = xW^T + b + scale * x(BA)^T\n",
        "    \"\"\"\n",
        "    def __init__(self, base_linear: nn.Linear, r: int = 8, alpha: int = 16, dropout: float = 0.0):\n",
        "        super().__init__()\n",
        "        assert isinstance(base_linear, nn.Linear)\n",
        "        self.base = base_linear\n",
        "        self.in_features = base_linear.in_features\n",
        "        self.out_features = base_linear.out_features\n",
        "\n",
        "        self.r = r\n",
        "        self.alpha = alpha\n",
        "        self.scale = alpha / r if r > 0 else 1.0\n",
        "        self.lora_dropout = nn.Dropout(dropout) if dropout > 0 else nn.Identity()\n",
        "\n",
        "        # Freeze base weights\n",
        "        self.base.weight.requires_grad = False\n",
        "        if self.base.bias is not None:\n",
        "            self.base.bias.requires_grad = False\n",
        "\n",
        "        # LoRA params\n",
        "        if r > 0:\n",
        "            self.lora_A = nn.Parameter(torch.zeros(r, self.in_features))\n",
        "            self.lora_B = nn.Parameter(torch.zeros(self.out_features, r))\n",
        "\n",
        "            # Init: A small random, B zeros => start as no-op\n",
        "            nn.init.kaiming_uniform_(self.lora_A, a=math.sqrt(5))\n",
        "            nn.init.zeros_(self.lora_B)\n",
        "        else:\n",
        "            self.register_parameter(\"lora_A\", None)\n",
        "            self.register_parameter(\"lora_B\", None)\n",
        "\n",
        "    def forward(self, x):\n",
        "        y = self.base(x)\n",
        "        if self.r > 0:\n",
        "            x_d = self.lora_dropout(x)\n",
        "            # (x @ A^T) @ B^T\n",
        "            lora = (x_d @ self.lora_A.t()) @ self.lora_B.t()\n",
        "            y = y + self.scale * lora\n",
        "        return y\n",
        "\n",
        "    @staticmethod\n",
        "    def apply_lora_to_hear_vit(\n",
        "        hear_model: nn.Module,\n",
        "        r: int = 8,\n",
        "        alpha: int = 16,\n",
        "        dropout: float = 0.05,\n",
        "        last_n_blocks: int = 2,\n",
        "        target_modules: list = None  # ['query', 'key', 'value'] or ['query', 'value']\n",
        "    ):\n",
        "        \"\"\"\n",
        "        Applies LoRA to HeAR model (Hugging Face ViT architecture).\n",
        "\n",
        "        HeAR Structure:\n",
        "        - hear_model.encoder.layer[i] = transformer blocks\n",
        "        - hear_model.encoder.layer[i].attention.attention.query/key/value = Linear layers\n",
        "\n",
        "        Args:\n",
        "            hear_model: HeAR model from transformers\n",
        "            r: LoRA rank\n",
        "            alpha: LoRA alpha (scaling)\n",
        "            dropout: LoRA dropout\n",
        "            last_n_blocks: Apply LoRA to last N blocks\n",
        "            target_modules: Which attention projections to apply LoRA to\n",
        "                          ['query', 'key', 'value'] or subset like ['query', 'value']\n",
        "        \"\"\"\n",
        "        if target_modules is None:\n",
        "            target_modules = ['query','key', 'value']  # Common choice, skip 'key'\n",
        "\n",
        "        # Freeze everything first\n",
        "        for p in hear_model.parameters():\n",
        "            p.requires_grad = False\n",
        "\n",
        "        # Access transformer blocks\n",
        "        # HuggingFace ViT: model.encoder.layer is ModuleList of ViTLayer\n",
        "        if not hasattr(hear_model, 'encoder'):\n",
        "            raise ValueError(\"Expected HeAR model with .encoder attribute\")\n",
        "\n",
        "        layers = hear_model.encoder.layer\n",
        "        start = max(0, len(layers) - last_n_blocks)\n",
        "\n",
        "        patched = 0\n",
        "        for i in range(start, len(layers)):\n",
        "            layer = layers[i]\n",
        "\n",
        "            # HuggingFace ViT attention structure:\n",
        "            # layer.attention.attention.query/key/value\n",
        "            if hasattr(layer, 'attention') and hasattr(layer.attention, 'attention'):\n",
        "                attn = layer.attention.attention\n",
        "\n",
        "                # Apply LoRA to specified modules\n",
        "                if 'query' in target_modules and isinstance(attn.query, nn.Linear):\n",
        "                    attn.query = LoRALinear(attn.query, r=r, alpha=alpha, dropout=dropout)\n",
        "                    patched += 1\n",
        "\n",
        "                if 'key' in target_modules and isinstance(attn.key, nn.Linear):\n",
        "                    attn.key = LoRALinear(attn.key, r=r, alpha=alpha, dropout=dropout)\n",
        "                    patched += 1\n",
        "\n",
        "                if 'value' in target_modules and isinstance(attn.value, nn.Linear):\n",
        "                    attn.value = LoRALinear(attn.value, r=r, alpha=alpha, dropout=dropout)\n",
        "                    patched += 1\n",
        "\n",
        "            # Make LayerNorm trainable in those blocks\n",
        "            for name, m in layer.named_modules():\n",
        "                if isinstance(m, nn.LayerNorm):\n",
        "                    for p in m.parameters():\n",
        "                        p.requires_grad = True\n",
        "\n",
        "        # Make final LayerNorm trainable\n",
        "        if hasattr(hear_model, 'layernorm') and isinstance(hear_model.layernorm, nn.LayerNorm):\n",
        "            for p in hear_model.layernorm.parameters():\n",
        "                p.requires_grad = True\n",
        "\n",
        "        print(f\"✓ LoRA applied to {patched} attention projections in last {last_n_blocks} blocks\")\n",
        "        print(f\"  Target modules: {target_modules}\")\n",
        "        print(f\"  LoRA rank: {r}, alpha: {alpha}, dropout: {dropout}\")\n",
        "\n",
        "        return hear_model\n",
        "\n",
        "class AdaptiveRespiratoryModel(nn.Module):\n",
        "    def __init__(\n",
        "        self,\n",
        "        num_classes: int = 2,\n",
        "        dropout: float = 0.4,\n",
        "        use_lora: bool = True,\n",
        "        lora_r: int = 8,\n",
        "        lora_alpha: int = 16,\n",
        "        lora_dropout: float = 0.05,\n",
        "        lora_last_n_blocks: int = 2,\n",
        "        rnn_hidden: int = 512,\n",
        "        rnn_layers: int = 2,\n",
        "    ):\n",
        "        super().__init__()\n",
        "\n",
        "        # Load HeAR backbone\n",
        "        self.hear = AutoModel.from_pretrained(\n",
        "            \"google/hear-pytorch\",\n",
        "            trust_remote_code=True\n",
        "        )\n",
        "\n",
        "        # Apply LoRA if requested\n",
        "        if use_lora:\n",
        "            print(\"Applying LoRA to HeAR backbone...\")\n",
        "            self.hear = LoRALinear.apply_lora_to_hear_vit(\n",
        "                self.hear,\n",
        "                r=lora_r,\n",
        "                alpha=lora_alpha,\n",
        "                dropout=lora_dropout,\n",
        "                last_n_blocks=lora_last_n_blocks,\n",
        "                target_modules=['query', 'value']\n",
        "            )\n",
        "        else:\n",
        "            # Freeze entire backbone\n",
        "            for p in self.hear.parameters():\n",
        "                p.requires_grad = False\n",
        "\n",
        "        self.feature_dim = 512\n",
        "\n",
        "        self.gate = GatedAttentionPool(\n",
        "            dim=self.feature_dim,  # Bidirectional doubles the output\n",
        "            attn_hidden=512,\n",
        "            dropout=dropout\n",
        "        )\n",
        "        classifier_input_dim = self.feature_dim\n",
        "        self.classifier = nn.Sequential(\n",
        "            nn.Linear(classifier_input_dim, classifier_input_dim // 2),\n",
        "            nn.GELU(),\n",
        "            nn.Dropout(dropout),\n",
        "            nn.Linear(classifier_input_dim // 2, num_classes)\n",
        "        )\n",
        "\n",
        "        self._print_trainable_params()\n",
        "\n",
        "    def _print_trainable_params(self):\n",
        "        \"\"\"Print trainable parameter statistics\"\"\"\n",
        "        trainable = sum(p.numel() for p in self.parameters() if p.requires_grad)\n",
        "        total = sum(p.numel() for p in self.parameters())\n",
        "\n",
        "        print(f\"\\n{'='*60}\")\n",
        "        print(f\"Model Parameter Summary:\")\n",
        "        print(f\"  Total parameters: {total:,}\")\n",
        "        print(f\"  Trainable parameters: {trainable:,}\")\n",
        "        print(f\"  Frozen parameters: {total - trainable:,}\")\n",
        "        print(f\"  Trainable %: {100 * trainable / total:.2f}%\")\n",
        "        print(f\"{'='*60}\\n\")\n",
        "\n",
        "    def forward(self, spectrogram_seq, lengths):\n",
        "        \"\"\"        Args:\n",
        "        spectrogram_seq: [B, T, 1, 192, 128]\n",
        "        lengths: [B] true lengths (num chunks per file)\n",
        "        \"\"\"\n",
        "        B, T, C, H, W = spectrogram_seq.shape\n",
        "\n",
        "        # Flatten to run HeAR in one pass\n",
        "        x = spectrogram_seq.view(B * T, C, H, W)\n",
        "        outputs = self.hear(x, return_dict=True)\n",
        "        emb = outputs.pooler_output  # [B*T, 512]\n",
        "\n",
        "        # Reshape back to sequence: [B, T, 512]\n",
        "        emb_seq = emb.view(B, T, -1)\n",
        "\n",
        "        # Apply gated attention pooling\n",
        "        pooled_emb, attn = self.gate(emb_seq, lengths)  # [B, rnn_hidden*2], [B, T]\n",
        "\n",
        "        # Classification\n",
        "        logits = self.classifier(pooled_emb)\n",
        "\n",
        "        return logits, attn"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "NZeFi5xED5pl"
      },
      "outputs": [],
      "source": [
        "######## Loss ########\n",
        "class FocalLoss(nn.Module):\n",
        "    \"\"\"\n",
        "    Multi-class Focal Loss.\n",
        "\n",
        "    Args:\n",
        "        gamma (float): focusing parameter (>= 0). Typical values: 1.0–2.0\n",
        "        alpha (Tensor or None): class weights, shape [num_classes]\n",
        "        reduction (str): 'mean', 'sum', or 'none'\n",
        "        eps (float): numerical stability\n",
        "    \"\"\"\n",
        "    def __init__(\n",
        "        self,\n",
        "        gamma: float = 2.0,\n",
        "        alpha: torch.Tensor | None = None,\n",
        "        reduction: str = \"mean\",\n",
        "        eps: float = 1e-8,\n",
        "    ):\n",
        "        super().__init__()\n",
        "        self.gamma = gamma\n",
        "        self.reduction = reduction\n",
        "        self.eps = eps\n",
        "\n",
        "        if alpha is not None:\n",
        "            self.register_buffer(\"alpha\", alpha)\n",
        "        else:\n",
        "            self.alpha = None\n",
        "\n",
        "    def forward(self, logits: torch.Tensor, targets: torch.Tensor) -> torch.Tensor:\n",
        "        \"\"\"\n",
        "        Args:\n",
        "            logits: [B, C] raw model outputs\n",
        "            targets: [B] class indices\n",
        "        \"\"\"\n",
        "        # Log-softmax for numerical stability\n",
        "        log_probs = F.log_softmax(logits, dim=1)\n",
        "        probs = log_probs.exp()\n",
        "\n",
        "        # Select the probabilities of the true classes\n",
        "        targets = targets.view(-1, 1)\n",
        "        log_pt = log_probs.gather(1, targets).squeeze(1)\n",
        "        pt = probs.gather(1, targets).squeeze(1)\n",
        "\n",
        "        # Focal term\n",
        "        focal_term = (1.0 - pt).clamp(min=0.0) ** self.gamma\n",
        "\n",
        "        loss = -focal_term * log_pt\n",
        "\n",
        "        # Apply class weights if provided\n",
        "        if self.alpha is not None:\n",
        "            alpha_t = self.alpha.gather(0, targets.squeeze(1))\n",
        "            loss = alpha_t * loss\n",
        "\n",
        "        if self.reduction == \"mean\":\n",
        "            return loss.mean()\n",
        "        elif self.reduction == \"sum\":\n",
        "            return loss.sum()\n",
        "        else:\n",
        "            return loss\n",
        "import numpy as np\n",
        "\n",
        "def find_best_thresholds_one_vs_rest(probs: np.ndarray,\n",
        "                                    y_true: np.ndarray,\n",
        "                                    num_classes: int,\n",
        "                                    grid_size: int = 101,\n",
        "                                    min_thr: float = 0.05,\n",
        "                                    max_thr: float = 0.95,Pmin =0.3):\n",
        "    \"\"\"\n",
        "    probs: [N, C] softmax probabilities\n",
        "    y_true: [N] int labels in 0..C-1\n",
        "    returns thresholds: [C] float thresholds maximizing F1 per class (one-vs-rest).\n",
        "    \"\"\"\n",
        "    thresholds = np.full(num_classes, 0.5, dtype=np.float32)\n",
        "    grid = np.linspace(min_thr, max_thr, grid_size)\n",
        "\n",
        "    for c in range(num_classes):\n",
        "        y_c = (y_true == c).astype(np.int32)  # one-vs-rest ground truth\n",
        "        p_c = probs[:, c]\n",
        "\n",
        "        best_f1 = -1.0\n",
        "        best_t = 0.5\n",
        "\n",
        "        for t in grid:\n",
        "            pred_c = (p_c >= t).astype(np.int32)\n",
        "\n",
        "            tp = np.sum((pred_c == 1) & (y_c == 1))\n",
        "            fp = np.sum((pred_c == 1) & (y_c == 0))\n",
        "            fn = np.sum((pred_c == 0) & (y_c == 1))\n",
        "\n",
        "            precision = tp / (tp + fp + 1e-12)\n",
        "            recall = tp / (tp + fn + 1e-12)\n",
        "            f1 = (2 * precision * recall) / (precision + recall + 1e-12)\n",
        "\n",
        "            if (precision >= Pmin and (f1 > best_f1 or (abs(f1-best_f1) < 1e-6 and t > best_t))):\n",
        "                best_f1 = f1\n",
        "                best_t = float(t)\n",
        "\n",
        "\n",
        "        thresholds[c] = best_t\n",
        "\n",
        "    return thresholds\n",
        "\n",
        "\n",
        "def predict_with_thresholds(probs: np.ndarray,\n",
        "                            thresholds: np.ndarray,\n",
        "                            abstain: bool = False,\n",
        "                            abstain_label: int | None = None):\n",
        "    \"\"\"\n",
        "    Multi-class decision rule using per-class thresholds.\n",
        "\n",
        "    Strategy:\n",
        "    - Compute margin = probs[:, c] - thresholds[c]\n",
        "    - If abstain=False:\n",
        "        pick argmax margin (always returns a class)\n",
        "    - If abstain=True:\n",
        "        if all margins < 0: return abstain_label (must be provided)\n",
        "        else pick argmax margin among margins\n",
        "    \"\"\"\n",
        "    margins = probs - thresholds.reshape(1, -1)  # [N, C]\n",
        "    best_c = np.argmax(margins, axis=1)\n",
        "    if not abstain:\n",
        "        return best_c\n",
        "\n",
        "    if abstain_label is None:\n",
        "        raise ValueError(\"abstain_label must be set when abstain=True\")\n",
        "\n",
        "    best_margin = np.max(margins, axis=1)\n",
        "    preds = best_c.copy()\n",
        "    preds[best_margin < 0.0] = abstain_label\n",
        "    return preds\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "background_save": true,
          "base_uri": "https://localhost:8080/",
          "height": 1000,
          "referenced_widgets": [
            "d6b8c80f70e24e33b6c2104d82484004",
            "c2fae8d5cbe54bbcbb93d5676f3b4db2",
            "8a9f0e5b71474967a27332869f7a1755",
            "b9f2f16c668b48efa2d019254d709dc3",
            "4cfb4d1f8ea54afa86ff3ce32a4889db",
            "db97babd15c84f3f97822363e857de50",
            "1370324eb86f47e785b4a1e04896e6b1",
            "16ec7b6cf9884aa2a1a77f5dfcb65d7c",
            "817e5330a42748878c92829bbde7a9cd",
            "2fd3c35342ff4fd0b72fbed909bb6cda",
            "8a806bdafb6046b18ce57d80ad413040",
            "a75cd80cecb54ec089a8de2fc59070a6",
            "b9cd2cccec9140319ff16bdcc40a884b",
            "aef1edfd1bf94319879409a909597dcd",
            "bb31de74d6774fdb9bb15b24917e9b4d",
            "e248e7c88b624c369ae18dee0e7d4c3d",
            "2cf91b6aad244705a9721b8704290d4b",
            "e1dc8e90ba904e439af9eaa3f27aff8f",
            "4d3b0629e80a4449870a784b5b62786b",
            "8f6b4022643d4a2b85cf0ff7ca1d39ae",
            "a195f061dde54d0b84bf4bc7af03663f",
            "3c95f65fafad4071ad9a16fdfd2ddab7",
            "e9a5eaf20a8a49e495e90fad044b26fb",
            "3e76226dc5f244d09c6ae03b074a505f",
            "05c3aa1ba9b84307bb8c6d4139fd4265",
            "e9895fad9318457a933fe6ce5e36cb5b",
            "024be6229952428ab2864b3eb55dc117",
            "47ead54cc29e4bb79e520462e69116d3",
            "2f2fa263a30e4ed1b80c06d41b13a29b",
            "066987f87c5b40758d7175504e83566d",
            "a61d354d50a3444388629ce15de0d1c2",
            "c55f046386b7485188c5a23110e93630",
            "48a0e4b5fa85417a92f38b44b162849c"
          ]
        },
        "id": "M2X9bqUbw0lJ",
        "outputId": "5cf6dea9-eeee-4017-b4e3-9e4a00a40488"
      },
      "outputs": [
        {
          "data": {
            "application/vnd.jupyter.widget-view+json": {
              "model_id": "d6b8c80f70e24e33b6c2104d82484004",
              "version_major": 2,
              "version_minor": 0
            },
            "text/plain": [
              "config.json:   0%|          | 0.00/533 [00:00<?, ?B/s]"
            ]
          },
          "metadata": {},
          "output_type": "display_data"
        },
        {
          "data": {
            "application/vnd.jupyter.widget-view+json": {
              "model_id": "a75cd80cecb54ec089a8de2fc59070a6",
              "version_major": 2,
              "version_minor": 0
            },
            "text/plain": [
              "pytorch_model.bin:   0%|          | 0.00/1.21G [00:00<?, ?B/s]"
            ]
          },
          "metadata": {},
          "output_type": "display_data"
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "Exception in thread Thread-auto_conversion:\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/local/lib/python3.12/dist-packages/huggingface_hub/utils/_http.py\", line 657, in hf_raise_for_status\n",
            "    response.raise_for_status()\n",
            "  File \"/usr/local/lib/python3.12/dist-packages/httpx/_models.py\", line 829, in raise_for_status\n",
            "    raise HTTPStatusError(message, request=request, response=self)\n",
            "httpx.HTTPStatusError: Client error '403 Forbidden' for url 'https://huggingface.co/api/models/google/hear-pytorch/discussions?p=0'\n",
            "For more information check: https://developer.mozilla.org/en-US/docs/Web/HTTP/Status/403\n",
            "\n",
            "The above exception was the direct cause of the following exception:\n",
            "\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.12/threading.py\", line 1075, in _bootstrap_inner\n",
            "    self.run()\n",
            "  File \"/usr/lib/python3.12/threading.py\", line 1012, in run\n",
            "    self._target(*self._args, **self._kwargs)\n",
            "  File \"/usr/local/lib/python3.12/dist-packages/transformers/safetensors_conversion.py\", line 116, in auto_conversion\n",
            "    raise e\n",
            "  File \"/usr/local/lib/python3.12/dist-packages/transformers/safetensors_conversion.py\", line 95, in auto_conversion\n",
            "    sha = get_conversion_pr_reference(api, pretrained_model_name_or_path, **cached_file_kwargs)\n",
            "          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n",
            "  File \"/usr/local/lib/python3.12/dist-packages/transformers/safetensors_conversion.py\", line 68, in get_conversion_pr_reference\n",
            "    pr = previous_pr(api, model_id, pr_title, token=token)\n",
            "         ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n",
            "  File \"/usr/local/lib/python3.12/dist-packages/transformers/safetensors_conversion.py\", line 14, in previous_pr\n",
            "    for discussion in get_repo_discussions(repo_id=model_id, token=token):\n",
            "                      ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n",
            "  File \"/usr/local/lib/python3.12/dist-packages/huggingface_hub/hf_api.py\", line 6350, in get_repo_discussions\n",
            "    discussions, has_next = _fetch_discussion_page(page_index=page_index)\n",
            "                            ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n",
            "  File \"/usr/local/lib/python3.12/dist-packages/huggingface_hub/hf_api.py\", line 6339, in _fetch_discussion_page\n",
            "    hf_raise_for_status(resp)\n",
            "  File \"/usr/local/lib/python3.12/dist-packages/huggingface_hub/utils/_http.py\", line 724, in hf_raise_for_status\n",
            "    raise _format(HfHubHTTPError, message, response) from e\n",
            "huggingface_hub.errors.HfHubHTTPError: (Request ID: Root=1-699852e3-151b64875474825470ea6364;ee865584-cffa-4193-8112-a8dc7239b70e)\n",
            "\n",
            "403 Forbidden: Discussions are disabled for this repo.\n",
            "Cannot access content at: https://huggingface.co/api/models/google/hear-pytorch/discussions?p=0.\n",
            "Make sure your token has the correct permissions.\n"
          ]
        },
        {
          "data": {
            "application/vnd.jupyter.widget-view+json": {
              "model_id": "e9a5eaf20a8a49e495e90fad044b26fb",
              "version_major": 2,
              "version_minor": 0
            },
            "text/plain": [
              "Loading weights:   0%|          | 0/392 [00:00<?, ?it/s]"
            ]
          },
          "metadata": {},
          "output_type": "display_data"
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Applying LoRA to HeAR backbone...\n",
            "✓ LoRA applied to 12 attention projections in last 6 blocks\n",
            "  Target modules: ['query', 'value']\n",
            "  LoRA rank: 16, alpha: 16, dropout: 0.3\n",
            "\n",
            "============================================================\n",
            "Model Parameter Summary:\n",
            "  Total parameters: 304,252,675\n",
            "  Trainable parameters: 1,079,555\n",
            "  Frozen parameters: 303,173,120\n",
            "  Trainable %: 0.35%\n",
            "============================================================\n",
            "\n",
            "Creating dataloaders...\n",
            "Loaded 4375 samples from /content/drive/MyDrive/SPRSound/SPRSound-main/train.csv\n",
            "Split: train\n",
            "Target SR: 16000 Hz (HeAR native)\n",
            "Number of classes: 2\n",
            "\n",
            "Class distribution:\n",
            "  [ 1] abnormal            :  1247 (28.50%)\n",
            "  [ 0] normal              :  3128 (71.50%)\n",
            "Loaded 1802 samples from /content/drive/MyDrive/SPRSound/SPRSound-main/val.csv\n",
            "Split: val\n",
            "Target SR: 16000 Hz (HeAR native)\n",
            "Number of classes: 2\n",
            "\n",
            "Class distribution:\n",
            "  [ 1] abnormal            :   483 (26.80%)\n",
            "  [ 0] normal              :  1319 (73.20%)\n",
            "Loaded 940 samples from /content/drive/MyDrive/SPRSound/SPRSound-main/test.csv\n",
            "Split: test\n",
            "Target SR: 16000 Hz (HeAR native)\n",
            "Number of classes: 2\n",
            "\n",
            "Class distribution:\n",
            "  [ 1] abnormal            :   236 (25.11%)\n",
            "  [ 0] normal              :   704 (74.89%)\n",
            "\n",
            "=== CLASS MAP CHECK ===\n",
            "Train: {'normal': 0, 'abnormal': 1}\n",
            "Val:   {'normal': 0, 'abnormal': 1}\n",
            "Test:  {'normal': 0, 'abnormal': 1}\n",
            "train == val ? True\n",
            "train == test? True\n",
            "\n",
            "================================================================================\n",
            "DATALOADERS CREATED\n",
            "================================================================================\n",
            "Train batches: 46\n",
            "Val batches: 19\n",
            "Test batches: 10\n",
            "Loading checkpoint from /content/drive/MyDrive/SPRSound/SPRSound-main/checkpoints/best_model.pth\n",
            "Resumed from epoch 24, best val f1: 0.7807\n",
            "\n",
            "================================================================================\n",
            "STARTING TRAINING\n",
            "================================================================================\n",
            "\n",
            "\n",
            "Epoch 25/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [17:44<00:00, 23.14s/it, lr=4.71e-05, batch=46/46, epoch=24/100, loss=0.1367]\n",
            "train_loss 0.13669420681569888, train_acc 0.7300571428571428, train_f1 0.7297639456500555,train_macro_auc 0.8046749184856321\n",
            "Validation:   5%|5         | 1/19 [01:09<20:58, 69.89s/it, epoch=24/100, batch=1/19, loss=0.1284]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [11:58<00:00, 37.80s/it, epoch=24/100, batch=19/19, loss=0.1374]\n",
            "\n",
            "Epoch 25 Summary:\n",
            "  Train Loss: 0.1367 | Acc: 0.7301 | F1: 0.7298\n",
            "  Val Loss: 0.1374 | Acc: 0.7625 | F1: 0.7660\n",
            "  Val F1 (macro): 0.7067 | Precision: 0.7708 | Recall: 0.7625 | auc macro 0.7877776155786507 | auc micro 0.7877776155786507 \n",
            "  Per-class AUC: {'normal': np.float64(0.7877776155786507), 'abnormal': np.float64(0.7877776155786507)}\n",
            "  Learning Rate: 4.67e-05\n",
            "\n",
            "Epoch 26/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [07:52<00:00, 10.27s/it, lr=4.67e-05, batch=46/46, epoch=25/100, loss=0.1347]\n",
            "train_loss 0.13473614062304082, train_acc 0.7364571428571428, train_f1 0.7353821763124363,train_macro_auc 0.8102887513882278\n",
            "Validation:   5%|5         | 1/19 [00:04<01:21,  4.54s/it, epoch=25/100, batch=1/19, loss=0.1243]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.91s/it, epoch=25/100, batch=19/19, loss=0.1244]\n",
            "\n",
            "Epoch 26 Summary:\n",
            "  Train Loss: 0.1347 | Acc: 0.7365 | F1: 0.7354\n",
            "  Val Loss: 0.1244 | Acc: 0.7930 | F1: 0.7835\n",
            "  Val F1 (macro): 0.7136 | Precision: 0.7816 | Recall: 0.7930 | auc macro 0.7929418264982099 | auc micro 0.7929418264982099 \n",
            "  Per-class AUC: {'normal': np.float64(0.7929418264982099), 'abnormal': np.float64(0.7929418264982099)}\n",
            "  Learning Rate: 4.63e-05\n",
            "✓ Best model saved: /content/drive/MyDrive/SPRSound/SPRSound-main/checkpoints/best_model.pth (metric: 0.7835)\n",
            "EarlyStopping counter: 1/20\n",
            "\n",
            "Epoch 27/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [03:46<00:00,  4.92s/it, lr=4.63e-05, batch=46/46, epoch=26/100, loss=0.1332]\n",
            "train_loss 0.13316683114870734, train_acc 0.7334857142857143, train_f1 0.7333692911486139,train_macro_auc 0.815940189060643\n",
            "Validation:   5%|5         | 1/19 [00:04<01:22,  4.60s/it, epoch=26/100, batch=1/19, loss=0.1225]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.91s/it, epoch=26/100, batch=19/19, loss=0.1267]\n",
            "\n",
            "Epoch 27 Summary:\n",
            "  Train Loss: 0.1332 | Acc: 0.7335 | F1: 0.7334\n",
            "  Val Loss: 0.1267 | Acc: 0.7869 | F1: 0.7804\n",
            "  Val F1 (macro): 0.7127 | Precision: 0.7775 | Recall: 0.7869 | auc macro 0.7908792814683312 | auc micro 0.7908792814683312 \n",
            "  Per-class AUC: {'normal': np.float64(0.7908792814683312), 'abnormal': np.float64(0.7908792814683312)}\n",
            "  Learning Rate: 4.58e-05\n",
            "EarlyStopping counter: 2/20\n",
            "\n",
            "Epoch 28/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [02:40<00:00,  3.49s/it, lr=4.58e-05, batch=46/46, epoch=27/100, loss=0.1318]\n",
            "train_loss 0.13184201992724254, train_acc 0.7385142857142857, train_f1 0.7383464937452324,train_macro_auc 0.8183363636363636\n",
            "Validation:   5%|5         | 1/19 [00:04<01:24,  4.68s/it, epoch=27/100, batch=1/19, loss=0.1316]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=27/100, batch=19/19, loss=0.1493]\n",
            "\n",
            "Epoch 28 Summary:\n",
            "  Train Loss: 0.1318 | Acc: 0.7385 | F1: 0.7383\n",
            "  Val Loss: 0.1493 | Acc: 0.7286 | F1: 0.7409\n",
            "  Val F1 (macro): 0.6904 | Precision: 0.7710 | Recall: 0.7286 | auc macro 0.796602294542104 | auc micro 0.796602294542104 \n",
            "  Per-class AUC: {'normal': np.float64(0.796602294542104), 'abnormal': np.float64(0.796602294542104)}\n",
            "  Learning Rate: 4.53e-05\n",
            "\n",
            "Epoch 29/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [02:03<00:00,  2.69s/it, lr=4.53e-05, batch=46/46, epoch=28/100, loss=0.1353]\n",
            "train_loss 0.1352918444444304, train_acc 0.7309714285714286, train_f1 0.7308537353164684,train_macro_auc 0.8104567794474327\n",
            "Validation:   5%|5         | 1/19 [00:04<01:22,  4.61s/it, epoch=28/100, batch=1/19, loss=0.1274]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.91s/it, epoch=28/100, batch=19/19, loss=0.1406]\n",
            "\n",
            "Epoch 29 Summary:\n",
            "  Train Loss: 0.1353 | Acc: 0.7310 | F1: 0.7309\n",
            "  Val Loss: 0.1406 | Acc: 0.7531 | F1: 0.7604\n",
            "  Val F1 (macro): 0.7054 | Precision: 0.7734 | Recall: 0.7531 | auc macro 0.793492780307561 | auc micro 0.793492780307561 \n",
            "  Per-class AUC: {'normal': np.float64(0.793492780307561), 'abnormal': np.float64(0.793492780307561)}\n",
            "  Learning Rate: 4.48e-05\n",
            "EarlyStopping counter: 1/20\n",
            "\n",
            "Epoch 30/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:52<00:00,  2.45s/it, lr=4.48e-05, batch=46/46, epoch=29/100, loss=0.1307]\n",
            "train_loss 0.13067345499344493, train_acc 0.7497142857142857, train_f1 0.7495999656513024,train_macro_auc 0.8259309317719368\n",
            "Validation:   5%|5         | 1/19 [00:04<01:25,  4.73s/it, epoch=29/100, batch=1/19, loss=0.1230]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=29/100, batch=19/19, loss=0.1221]\n",
            "\n",
            "Epoch 30 Summary:\n",
            "  Train Loss: 0.1307 | Acc: 0.7497 | F1: 0.7496\n",
            "  Val Loss: 0.1221 | Acc: 0.7902 | F1: 0.7752\n",
            "  Val F1 (macro): 0.6974 | Precision: 0.7764 | Recall: 0.7902 | auc macro 0.789052186784329 | auc micro 0.789052186784329 \n",
            "  Per-class AUC: {'normal': np.float64(0.789052186784329), 'abnormal': np.float64(0.789052186784329)}\n",
            "  Learning Rate: 4.43e-05\n",
            "EarlyStopping counter: 2/20\n",
            "\n",
            "Epoch 31/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:54<00:00,  2.50s/it, lr=4.43e-05, batch=46/46, epoch=30/100, loss=0.1381]\n",
            "train_loss 0.13805834657472113, train_acc 0.7254857142857143, train_f1 0.7254521533725813,train_macro_auc 0.8019131664186949\n",
            "Validation:   5%|5         | 1/19 [00:04<01:22,  4.59s/it, epoch=30/100, batch=1/19, loss=0.1285]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.91s/it, epoch=30/100, batch=19/19, loss=0.1411]\n",
            "\n",
            "Epoch 31 Summary:\n",
            "  Train Loss: 0.1381 | Acc: 0.7255 | F1: 0.7255\n",
            "  Val Loss: 0.1411 | Acc: 0.7586 | F1: 0.7654\n",
            "  Val F1 (macro): 0.7111 | Precision: 0.7774 | Recall: 0.7586 | auc macro 0.7959493122495396 | auc micro 0.7959493122495396 \n",
            "  Per-class AUC: {'normal': np.float64(0.7959493122495396), 'abnormal': np.float64(0.7959493122495396)}\n",
            "  Learning Rate: 4.37e-05\n",
            "EarlyStopping counter: 3/20\n",
            "\n",
            "Epoch 32/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:50<00:00,  2.40s/it, lr=4.37e-05, batch=46/46, epoch=31/100, loss=0.1323]\n",
            "train_loss 0.1323186943064565, train_acc 0.7465142857142857, train_f1 0.7459640394628748,train_macro_auc 0.8198879111582236\n",
            "Validation:   5%|5         | 1/19 [00:04<01:23,  4.62s/it, epoch=31/100, batch=1/19, loss=0.1250]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=31/100, batch=19/19, loss=0.1391]\n",
            "\n",
            "Epoch 32 Summary:\n",
            "  Train Loss: 0.1323 | Acc: 0.7465 | F1: 0.7460\n",
            "  Val Loss: 0.1391 | Acc: 0.7564 | F1: 0.7634\n",
            "  Val F1 (macro): 0.7087 | Precision: 0.7757 | Recall: 0.7564 | auc macro 0.8005923930702254 | auc micro 0.8005923930702254 \n",
            "  Per-class AUC: {'normal': np.float64(0.8005923930702254), 'abnormal': np.float64(0.8005923930702254)}\n",
            "  Learning Rate: 4.31e-05\n",
            "EarlyStopping counter: 4/20\n",
            "\n",
            "Epoch 33/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:49<00:00,  2.37s/it, lr=4.31e-05, batch=46/46, epoch=32/100, loss=0.1351]\n",
            "train_loss 0.1350966952741146, train_acc 0.7300571428571428, train_f1 0.7298958757553283,train_macro_auc 0.8137483505105947\n",
            "Validation:   5%|5         | 1/19 [00:04<01:24,  4.67s/it, epoch=32/100, batch=1/19, loss=0.1278]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=32/100, batch=19/19, loss=0.1436]\n",
            "\n",
            "Epoch 33 Summary:\n",
            "  Train Loss: 0.1351 | Acc: 0.7301 | F1: 0.7299\n",
            "  Val Loss: 0.1436 | Acc: 0.7514 | F1: 0.7606\n",
            "  Val F1 (macro): 0.7093 | Precision: 0.7801 | Recall: 0.7514 | auc macro 0.7994339773685127 | auc micro 0.7994339773685127 \n",
            "  Per-class AUC: {'normal': np.float64(0.7994339773685127), 'abnormal': np.float64(0.7994339773685127)}\n",
            "  Learning Rate: 4.25e-05\n",
            "EarlyStopping counter: 5/20\n",
            "\n",
            "Epoch 34/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [02:18<00:00,  3.01s/it, lr=4.25e-05, batch=46/46, epoch=33/100, loss=0.1286]\n",
            "train_loss 0.12855539276548053, train_acc 0.7504, train_f1 0.7501042474533363,train_macro_auc 0.8319556516923206\n",
            "Validation:   5%|5         | 1/19 [00:04<01:22,  4.61s/it, epoch=33/100, batch=1/19, loss=0.1201]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.91s/it, epoch=33/100, batch=19/19, loss=0.1281]\n",
            "\n",
            "Epoch 34 Summary:\n",
            "  Train Loss: 0.1286 | Acc: 0.7504 | F1: 0.7501\n",
            "  Val Loss: 0.1281 | Acc: 0.7836 | F1: 0.7815\n",
            "  Val F1 (macro): 0.7190 | Precision: 0.7798 | Recall: 0.7836 | auc macro 0.7973965470421943 | auc micro 0.7973965470421943 \n",
            "  Per-class AUC: {'normal': np.float64(0.7973965470421943), 'abnormal': np.float64(0.7973965470421943)}\n",
            "  Learning Rate: 4.19e-05\n",
            "EarlyStopping counter: 6/20\n",
            "\n",
            "Epoch 35/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:48<00:00,  2.36s/it, lr=4.19e-05, batch=46/46, epoch=34/100, loss=0.1261]\n",
            "train_loss 0.12614017644006273, train_acc 0.7554285714285714, train_f1 0.7552581295039328,train_macro_auc 0.8403978251655829\n",
            "Validation:   5%|5         | 1/19 [00:04<01:23,  4.65s/it, epoch=34/100, batch=1/19, loss=0.1218]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=34/100, batch=19/19, loss=0.1339]\n",
            "\n",
            "Epoch 35 Summary:\n",
            "  Train Loss: 0.1261 | Acc: 0.7554 | F1: 0.7553\n",
            "  Val Loss: 0.1339 | Acc: 0.7686 | F1: 0.7733\n",
            "  Val F1 (macro): 0.7177 | Precision: 0.7805 | Recall: 0.7686 | auc macro 0.8034052398689641 | auc micro 0.8034052398689641 \n",
            "  Per-class AUC: {'normal': np.float64(0.8034052398689641), 'abnormal': np.float64(0.8034052398689641)}\n",
            "  Learning Rate: 4.12e-05\n",
            "EarlyStopping counter: 7/20\n",
            "\n",
            "Epoch 36/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:49<00:00,  2.38s/it, lr=4.12e-05, batch=46/46, epoch=35/100, loss=0.1300]\n",
            "train_loss 0.1299514798042567, train_acc 0.7545142857142857, train_f1 0.7543547379362915,train_macro_auc 0.8298197592722161\n",
            "Validation:   5%|5         | 1/19 [00:04<01:22,  4.60s/it, epoch=35/100, batch=1/19, loss=0.1225]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.91s/it, epoch=35/100, batch=19/19, loss=0.1339]\n",
            "\n",
            "Epoch 36 Summary:\n",
            "  Train Loss: 0.1300 | Acc: 0.7545 | F1: 0.7544\n",
            "  Val Loss: 0.1339 | Acc: 0.7691 | F1: 0.7727\n",
            "  Val F1 (macro): 0.7152 | Precision: 0.7776 | Recall: 0.7691 | auc macro 0.7974043953870569 | auc micro 0.7974043953870569 \n",
            "  Per-class AUC: {'normal': np.float64(0.7974043953870569), 'abnormal': np.float64(0.7974043953870569)}\n",
            "  Learning Rate: 4.06e-05\n",
            "EarlyStopping counter: 8/20\n",
            "\n",
            "Epoch 37/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:50<00:00,  2.39s/it, lr=4.06e-05, batch=46/46, epoch=36/100, loss=0.1310]\n",
            "train_loss 0.13101088563385216, train_acc 0.7419428571428571, train_f1 0.7410489804725823,train_macro_auc 0.8235992206016828\n",
            "Validation:   5%|5         | 1/19 [00:04<01:23,  4.62s/it, epoch=36/100, batch=1/19, loss=0.1237]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.91s/it, epoch=36/100, batch=19/19, loss=0.1392]\n",
            "\n",
            "Epoch 37 Summary:\n",
            "  Train Loss: 0.1310 | Acc: 0.7419 | F1: 0.7410\n",
            "  Val Loss: 0.1392 | Acc: 0.7669 | F1: 0.7731\n",
            "  Val F1 (macro): 0.7196 | Precision: 0.7836 | Recall: 0.7669 | auc macro 0.8015357641227041 | auc micro 0.8015357641227041 \n",
            "  Per-class AUC: {'normal': np.float64(0.8015357641227041), 'abnormal': np.float64(0.8015357641227041)}\n",
            "  Learning Rate: 3.99e-05\n",
            "EarlyStopping counter: 9/20\n",
            "\n",
            "Epoch 38/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:50<00:00,  2.39s/it, lr=3.99e-05, batch=46/46, epoch=37/100, loss=0.1281]\n",
            "train_loss 0.12811135630244794, train_acc 0.7494857142857143, train_f1 0.7494324419357934,train_macro_auc 0.833071931576078\n",
            "Validation:   5%|5         | 1/19 [00:04<01:25,  4.74s/it, epoch=37/100, batch=1/19, loss=0.1198]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=37/100, batch=19/19, loss=0.1351]\n",
            "\n",
            "Epoch 38 Summary:\n",
            "  Train Loss: 0.1281 | Acc: 0.7495 | F1: 0.7494\n",
            "  Val Loss: 0.1351 | Acc: 0.7703 | F1: 0.7754\n",
            "  Val F1 (macro): 0.7212 | Precision: 0.7837 | Recall: 0.7703 | auc macro 0.8080593083724573 | auc micro 0.8080593083724573 \n",
            "  Per-class AUC: {'normal': np.float64(0.8080593083724573), 'abnormal': np.float64(0.8080593083724573)}\n",
            "  Learning Rate: 3.92e-05\n",
            "EarlyStopping counter: 10/20\n",
            "\n",
            "Epoch 39/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:48<00:00,  2.36s/it, lr=3.92e-05, batch=46/46, epoch=38/100, loss=0.1271]\n",
            "train_loss 0.1271479824638885, train_acc 0.7549714285714286, train_f1 0.7546203096884866,train_macro_auc 0.8358546036344913\n",
            "Validation:   5%|5         | 1/19 [00:04<01:24,  4.67s/it, epoch=38/100, batch=1/19, loss=0.1169]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=38/100, batch=19/19, loss=0.1358]\n",
            "\n",
            "Epoch 39 Summary:\n",
            "  Train Loss: 0.1271 | Acc: 0.7550 | F1: 0.7546\n",
            "  Val Loss: 0.1358 | Acc: 0.7747 | F1: 0.7795\n",
            "  Val F1 (macro): 0.7256 | Precision: 0.7869 | Recall: 0.7747 | auc macro 0.8056875385549942 | auc micro 0.8056875385549942 \n",
            "  Per-class AUC: {'normal': np.float64(0.8056875385549942), 'abnormal': np.float64(0.8056875385549942)}\n",
            "  Learning Rate: 3.85e-05\n",
            "EarlyStopping counter: 11/20\n",
            "\n",
            "Epoch 40/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:49<00:00,  2.38s/it, lr=3.85e-05, batch=46/46, epoch=39/100, loss=0.1278]\n",
            "train_loss 0.1278001819939717, train_acc 0.7538285714285714, train_f1 0.7537454679928759,train_macro_auc 0.8356097650687339\n",
            "Validation:   5%|5         | 1/19 [00:04<01:25,  4.75s/it, epoch=39/100, batch=1/19, loss=0.1160]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=39/100, batch=19/19, loss=0.1283]\n",
            "\n",
            "Epoch 40 Summary:\n",
            "  Train Loss: 0.1278 | Acc: 0.7538 | F1: 0.7537\n",
            "  Val Loss: 0.1283 | Acc: 0.7863 | F1: 0.7860\n",
            "  Val F1 (macro): 0.7269 | Precision: 0.7857 | Recall: 0.7863 | auc macro 0.8091455193014345 | auc micro 0.8091455193014345 \n",
            "  Per-class AUC: {'normal': np.float64(0.8091455193014345), 'abnormal': np.float64(0.8091455193014345)}\n",
            "  Learning Rate: 3.78e-05\n",
            "✓ Best model saved: /content/drive/MyDrive/SPRSound/SPRSound-main/checkpoints/best_model.pth (metric: 0.7860)\n",
            "EarlyStopping counter: 12/20\n",
            "\n",
            "Epoch 41/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:52<00:00,  2.44s/it, lr=3.78e-05, batch=46/46, epoch=40/100, loss=0.1301]\n",
            "train_loss 0.1300958952178126, train_acc 0.7501714285714286, train_f1 0.7495298639586607,train_macro_auc 0.8292786754923707\n",
            "Validation:   5%|5         | 1/19 [00:04<01:24,  4.70s/it, epoch=40/100, batch=1/19, loss=0.1136]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=40/100, batch=19/19, loss=0.1214]\n",
            "\n",
            "Epoch 41 Summary:\n",
            "  Train Loss: 0.1301 | Acc: 0.7502 | F1: 0.7495\n",
            "  Val Loss: 0.1214 | Acc: 0.7986 | F1: 0.7945\n",
            "  Val F1 (macro): 0.7334 | Precision: 0.7922 | Recall: 0.7986 | auc macro 0.8097969319250264 | auc micro 0.8097969319250264 \n",
            "  Per-class AUC: {'normal': np.float64(0.8097969319250264), 'abnormal': np.float64(0.8097969319250264)}\n",
            "  Learning Rate: 3.70e-05\n",
            "✓ Best model saved: /content/drive/MyDrive/SPRSound/SPRSound-main/checkpoints/best_model.pth (metric: 0.7945)\n",
            "EarlyStopping counter: 13/20\n",
            "\n",
            "Epoch 42/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [02:00<00:00,  2.61s/it, lr=3.70e-05, batch=46/46, epoch=41/100, loss=0.1269]\n",
            "train_loss 0.12694751098752022, train_acc 0.7625142857142857, train_f1 0.7622329269812209,train_macro_auc 0.8381250266448993\n",
            "Validation:   5%|5         | 1/19 [00:04<01:23,  4.63s/it, epoch=41/100, batch=1/19, loss=0.1172]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.91s/it, epoch=41/100, batch=19/19, loss=0.1283]\n",
            "\n",
            "Epoch 42 Summary:\n",
            "  Train Loss: 0.1269 | Acc: 0.7625 | F1: 0.7622\n",
            "  Val Loss: 0.1283 | Acc: 0.7614 | F1: 0.7695\n",
            "  Val F1 (macro): 0.7187 | Precision: 0.7861 | Recall: 0.7614 | auc macro 0.8081942999040931 | auc micro 0.8081942999040931 \n",
            "  Per-class AUC: {'normal': np.float64(0.8081942999040931), 'abnormal': np.float64(0.8081942999040931)}\n",
            "  Learning Rate: 3.62e-05\n",
            "EarlyStopping counter: 14/20\n",
            "\n",
            "Epoch 43/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:49<00:00,  2.39s/it, lr=3.62e-05, batch=46/46, epoch=42/100, loss=0.1273]\n",
            "train_loss 0.12725647619884947, train_acc 0.7613714285714286, train_f1 0.7612329586380007,train_macro_auc 0.8402295881474199\n",
            "Validation:   5%|5         | 1/19 [00:04<01:22,  4.61s/it, epoch=42/100, batch=1/19, loss=0.1149]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.91s/it, epoch=42/100, batch=19/19, loss=0.1294]\n",
            "\n",
            "Epoch 43 Summary:\n",
            "  Train Loss: 0.1273 | Acc: 0.7614 | F1: 0.7612\n",
            "  Val Loss: 0.1294 | Acc: 0.7531 | F1: 0.7626\n",
            "  Val F1 (macro): 0.7125 | Precision: 0.7837 | Recall: 0.7531 | auc macro 0.8096383953588027 | auc micro 0.8096383953588027 \n",
            "  Per-class AUC: {'normal': np.float64(0.8096383953588027), 'abnormal': np.float64(0.8096383953588027)}\n",
            "  Learning Rate: 3.55e-05\n",
            "EarlyStopping counter: 15/20\n",
            "\n",
            "Epoch 44/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:49<00:00,  2.37s/it, lr=3.55e-05, batch=46/46, epoch=43/100, loss=0.1214]\n",
            "train_loss 0.12141808527319328, train_acc 0.7698285714285714, train_f1 0.7697587201779238,train_macro_auc 0.8532620556274645\n",
            "Validation:   5%|5         | 1/19 [00:04<01:23,  4.65s/it, epoch=43/100, batch=1/19, loss=0.1132]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=43/100, batch=19/19, loss=0.1252]\n",
            "\n",
            "Epoch 44 Summary:\n",
            "  Train Loss: 0.1214 | Acc: 0.7698 | F1: 0.7698\n",
            "  Val Loss: 0.1252 | Acc: 0.7758 | F1: 0.7796\n",
            "  Val F1 (macro): 0.7244 | Precision: 0.7851 | Recall: 0.7758 | auc macro 0.8066293399385003 | auc micro 0.8066293399385003 \n",
            "  Per-class AUC: {'normal': np.float64(0.8066293399385003), 'abnormal': np.float64(0.8066293399385003)}\n",
            "  Learning Rate: 3.47e-05\n",
            "EarlyStopping counter: 16/20\n",
            "\n",
            "Epoch 45/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:49<00:00,  2.37s/it, lr=3.47e-05, batch=46/46, epoch=44/100, loss=0.1259]\n",
            "train_loss 0.12593740483988886, train_acc 0.7570285714285714, train_f1 0.756859158320604,train_macro_auc 0.8400198852366435\n",
            "Validation:   5%|5         | 1/19 [00:04<01:24,  4.70s/it, epoch=44/100, batch=1/19, loss=0.1126]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=44/100, batch=19/19, loss=0.1266]\n",
            "\n",
            "Epoch 45 Summary:\n",
            "  Train Loss: 0.1259 | Acc: 0.7570 | F1: 0.7569\n",
            "  Val Loss: 0.1266 | Acc: 0.7725 | F1: 0.7774\n",
            "  Val F1 (macro): 0.7232 | Precision: 0.7851 | Recall: 0.7725 | auc macro 0.8074926578733811 | auc micro 0.8074926578733811 \n",
            "  Per-class AUC: {'normal': np.float64(0.8074926578733811), 'abnormal': np.float64(0.8074926578733811)}\n",
            "  Learning Rate: 3.39e-05\n",
            "EarlyStopping counter: 17/20\n",
            "\n",
            "Epoch 46/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:51<00:00,  2.42s/it, lr=3.39e-05, batch=46/46, epoch=45/100, loss=0.1232]\n",
            "train_loss 0.1231830031003641, train_acc 0.7677714285714285, train_f1 0.7677102755572275,train_macro_auc 0.8502682664371481\n",
            "Validation:   5%|5         | 1/19 [00:04<01:25,  4.72s/it, epoch=45/100, batch=1/19, loss=0.1220]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=45/100, batch=19/19, loss=0.1495]\n",
            "\n",
            "Epoch 46 Summary:\n",
            "  Train Loss: 0.1232 | Acc: 0.7678 | F1: 0.7677\n",
            "  Val Loss: 0.1495 | Acc: 0.6792 | F1: 0.6975\n",
            "  Val F1 (macro): 0.6581 | Precision: 0.7767 | Recall: 0.6792 | auc macro 0.810131271416171 | auc micro 0.810131271416171 \n",
            "  Per-class AUC: {'normal': np.float64(0.810131271416171), 'abnormal': np.float64(0.810131271416171)}\n",
            "  Learning Rate: 3.31e-05\n",
            "\n",
            "Epoch 47/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:51<00:00,  2.42s/it, lr=3.31e-05, batch=46/46, epoch=46/100, loss=0.1220]\n",
            "train_loss 0.12196760316905768, train_acc 0.768, train_f1 0.7678942291684274,train_macro_auc 0.8538491904932274\n",
            "Validation:   5%|5         | 1/19 [00:04<01:25,  4.72s/it, epoch=46/100, batch=1/19, loss=0.1113]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=46/100, batch=19/19, loss=0.1280]\n",
            "\n",
            "Epoch 47 Summary:\n",
            "  Train Loss: 0.1220 | Acc: 0.7680 | F1: 0.7679\n",
            "  Val Loss: 0.1280 | Acc: 0.7653 | F1: 0.7717\n",
            "  Val F1 (macro): 0.7184 | Precision: 0.7830 | Recall: 0.7653 | auc macro 0.807034314533408 | auc micro 0.807034314533408 \n",
            "  Per-class AUC: {'normal': np.float64(0.807034314533408), 'abnormal': np.float64(0.807034314533408)}\n",
            "  Learning Rate: 3.23e-05\n",
            "EarlyStopping counter: 1/20\n",
            "\n",
            "Epoch 48/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:50<00:00,  2.40s/it, lr=3.23e-05, batch=46/46, epoch=47/100, loss=0.1240]\n",
            "train_loss 0.12404598846383717, train_acc 0.7616, train_f1 0.7611898245049274,train_macro_auc 0.8477740411662573\n",
            "Validation:   5%|5         | 1/19 [00:04<01:22,  4.61s/it, epoch=47/100, batch=1/19, loss=0.1126]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.91s/it, epoch=47/100, batch=19/19, loss=0.1321]\n",
            "\n",
            "Epoch 48 Summary:\n",
            "  Train Loss: 0.1240 | Acc: 0.7616 | F1: 0.7612\n",
            "  Val Loss: 0.1321 | Acc: 0.7475 | F1: 0.7580\n",
            "  Val F1 (macro): 0.7085 | Precision: 0.7826 | Recall: 0.7475 | auc macro 0.8163047794850543 | auc micro 0.8163047794850543 \n",
            "  Per-class AUC: {'normal': np.float64(0.8163047794850543), 'abnormal': np.float64(0.8163047794850543)}\n",
            "  Learning Rate: 3.14e-05\n",
            "EarlyStopping counter: 2/20\n",
            "\n",
            "Epoch 49/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:48<00:00,  2.37s/it, lr=3.14e-05, batch=46/46, epoch=48/100, loss=0.1252]\n",
            "train_loss 0.1251622814199199, train_acc 0.7577142857142857, train_f1 0.7577323620295395,train_macro_auc 0.8421024022532311\n",
            "Validation:   5%|5         | 1/19 [00:04<01:27,  4.84s/it, epoch=48/100, batch=1/19, loss=0.1133]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.93s/it, epoch=48/100, batch=19/19, loss=0.1341]\n",
            "\n",
            "Epoch 49 Summary:\n",
            "  Train Loss: 0.1252 | Acc: 0.7577 | F1: 0.7577\n",
            "  Val Loss: 0.1341 | Acc: 0.7370 | F1: 0.7495\n",
            "  Val F1 (macro): 0.7027 | Precision: 0.7841 | Recall: 0.7370 | auc macro 0.8142469434620931 | auc micro 0.8142469434620931 \n",
            "  Per-class AUC: {'normal': np.float64(0.8142469434620931), 'abnormal': np.float64(0.8142469434620931)}\n",
            "  Learning Rate: 3.06e-05\n",
            "EarlyStopping counter: 3/20\n",
            "\n",
            "Epoch 50/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:50<00:00,  2.40s/it, lr=3.06e-05, batch=46/46, epoch=49/100, loss=0.1237]\n",
            "train_loss 0.12373895343878995, train_acc 0.7657142857142857, train_f1 0.7656052233692923,train_macro_auc 0.8484370519070835\n",
            "Validation:   5%|5         | 1/19 [00:04<01:26,  4.81s/it, epoch=49/100, batch=1/19, loss=0.1120]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.93s/it, epoch=49/100, batch=19/19, loss=0.1319]\n",
            "\n",
            "Epoch 50 Summary:\n",
            "  Train Loss: 0.1237 | Acc: 0.7657 | F1: 0.7656\n",
            "  Val Loss: 0.1319 | Acc: 0.7519 | F1: 0.7618\n",
            "  Val F1 (macro): 0.7123 | Precision: 0.7845 | Recall: 0.7519 | auc macro 0.8112394577107634 | auc micro 0.8112394577107634 \n",
            "  Per-class AUC: {'normal': np.float64(0.8112394577107634), 'abnormal': np.float64(0.8112394577107634)}\n",
            "  Learning Rate: 2.98e-05\n",
            "EarlyStopping counter: 4/20\n",
            "\n",
            "Epoch 51/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:50<00:00,  2.41s/it, lr=2.98e-05, batch=46/46, epoch=50/100, loss=0.1246]\n",
            "train_loss 0.12455410899027534, train_acc 0.7584, train_f1 0.7581397138298029,train_macro_auc 0.8434447558883822\n",
            "Validation:   5%|5         | 1/19 [00:04<01:24,  4.72s/it, epoch=50/100, batch=1/19, loss=0.1104]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=50/100, batch=19/19, loss=0.1244]\n",
            "\n",
            "Epoch 51 Summary:\n",
            "  Train Loss: 0.1246 | Acc: 0.7584 | F1: 0.7581\n",
            "  Val Loss: 0.1244 | Acc: 0.7752 | F1: 0.7802\n",
            "  Val F1 (macro): 0.7268 | Precision: 0.7880 | Recall: 0.7752 | auc macro 0.8138576655569106 | auc micro 0.8138576655569106 \n",
            "  Per-class AUC: {'normal': np.float64(0.8138576655569106), 'abnormal': np.float64(0.8138576655569106)}\n",
            "  Learning Rate: 2.89e-05\n",
            "EarlyStopping counter: 5/20\n",
            "\n",
            "Epoch 52/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:49<00:00,  2.38s/it, lr=2.89e-05, batch=46/46, epoch=51/100, loss=0.1237]\n",
            "train_loss 0.12371515272104222, train_acc 0.7716571428571428, train_f1 0.7714475133500326,train_macro_auc 0.8493825488657005\n",
            "Validation:   5%|5         | 1/19 [00:04<01:26,  4.81s/it, epoch=51/100, batch=1/19, loss=0.1097]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.93s/it, epoch=51/100, batch=19/19, loss=0.1237]\n",
            "\n",
            "Epoch 52 Summary:\n",
            "  Train Loss: 0.1237 | Acc: 0.7717 | F1: 0.7714\n",
            "  Val Loss: 0.1237 | Acc: 0.7791 | F1: 0.7833\n",
            "  Val F1 (macro): 0.7295 | Precision: 0.7894 | Recall: 0.7791 | auc macro 0.8141370666340174 | auc micro 0.8141370666340174 \n",
            "  Per-class AUC: {'normal': np.float64(0.8141370666340174), 'abnormal': np.float64(0.8141370666340174)}\n",
            "  Learning Rate: 2.81e-05\n",
            "EarlyStopping counter: 6/20\n",
            "\n",
            "Epoch 53/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:51<00:00,  2.43s/it, lr=2.81e-05, batch=46/46, epoch=52/100, loss=0.1207]\n",
            "train_loss 0.12068190603800442, train_acc 0.7796571428571428, train_f1 0.7794169740776237,train_macro_auc 0.8572221058892222\n",
            "Validation:   5%|5         | 1/19 [00:04<01:26,  4.82s/it, epoch=52/100, batch=1/19, loss=0.1122]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=52/100, batch=19/19, loss=0.1359]\n",
            "\n",
            "Epoch 53 Summary:\n",
            "  Train Loss: 0.1207 | Acc: 0.7797 | F1: 0.7794\n",
            "  Val Loss: 0.1359 | Acc: 0.7370 | F1: 0.7493\n",
            "  Val F1 (macro): 0.7016 | Precision: 0.7821 | Recall: 0.7370 | auc macro 0.8123774677158335 | auc micro 0.8123774677158335 \n",
            "  Per-class AUC: {'normal': np.float64(0.8123774677158335), 'abnormal': np.float64(0.8123774677158335)}\n",
            "  Learning Rate: 2.72e-05\n",
            "EarlyStopping counter: 7/20\n",
            "\n",
            "Epoch 54/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:51<00:00,  2.42s/it, lr=2.72e-05, batch=46/46, epoch=53/100, loss=0.1251]\n",
            "train_loss 0.12507429103488507, train_acc 0.7652571428571429, train_f1 0.7651198930892305,train_macro_auc 0.8458850574712644\n",
            "Validation:   5%|5         | 1/19 [00:04<01:24,  4.72s/it, epoch=53/100, batch=1/19, loss=0.1081]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=53/100, batch=19/19, loss=0.1249]\n",
            "\n",
            "Epoch 54 Summary:\n",
            "  Train Loss: 0.1251 | Acc: 0.7653 | F1: 0.7651\n",
            "  Val Loss: 0.1249 | Acc: 0.7703 | F1: 0.7761\n",
            "  Val F1 (macro): 0.7230 | Precision: 0.7860 | Recall: 0.7703 | auc macro 0.8151667694799842 | auc micro 0.8151667694799842 \n",
            "  Per-class AUC: {'normal': np.float64(0.8151667694799842), 'abnormal': np.float64(0.8151667694799842)}\n",
            "  Learning Rate: 2.64e-05\n",
            "EarlyStopping counter: 8/20\n",
            "\n",
            "Epoch 55/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:50<00:00,  2.40s/it, lr=2.64e-05, batch=46/46, epoch=54/100, loss=0.1218]\n",
            "train_loss 0.12184809180705444, train_acc 0.7707428571428572, train_f1 0.7704979476339313,train_macro_auc 0.852970743792602\n",
            "Validation:   5%|5         | 1/19 [00:04<01:23,  4.65s/it, epoch=54/100, batch=1/19, loss=0.1096]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=54/100, batch=19/19, loss=0.1233]\n",
            "\n",
            "Epoch 55 Summary:\n",
            "  Train Loss: 0.1218 | Acc: 0.7707 | F1: 0.7705\n",
            "  Val Loss: 0.1233 | Acc: 0.7786 | F1: 0.7823\n",
            "  Val F1 (macro): 0.7277 | Precision: 0.7876 | Recall: 0.7786 | auc macro 0.8110212737235845 | auc micro 0.8110212737235845 \n",
            "  Per-class AUC: {'normal': np.float64(0.8110212737235845), 'abnormal': np.float64(0.8110212737235845)}\n",
            "  Learning Rate: 2.55e-05\n",
            "EarlyStopping counter: 9/20\n",
            "\n",
            "Epoch 56/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:49<00:00,  2.38s/it, lr=2.55e-05, batch=46/46, epoch=55/100, loss=0.1228]\n",
            "train_loss 0.12277322392100873, train_acc 0.7741714285714286, train_f1 0.7739612994953543,train_macro_auc 0.8509859510491469\n",
            "Validation:   5%|5         | 1/19 [00:04<01:25,  4.74s/it, epoch=55/100, batch=1/19, loss=0.1094]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=55/100, batch=19/19, loss=0.1224]\n",
            "\n",
            "Epoch 56 Summary:\n",
            "  Train Loss: 0.1228 | Acc: 0.7742 | F1: 0.7740\n",
            "  Val Loss: 0.1224 | Acc: 0.7808 | F1: 0.7846\n",
            "  Val F1 (macro): 0.7307 | Precision: 0.7901 | Recall: 0.7808 | auc macro 0.8160190997320577 | auc micro 0.8160190997320577 \n",
            "  Per-class AUC: {'normal': np.float64(0.8160190997320577), 'abnormal': np.float64(0.8160190997320577)}\n",
            "  Learning Rate: 2.46e-05\n",
            "EarlyStopping counter: 10/20\n",
            "\n",
            "Epoch 57/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:50<00:00,  2.41s/it, lr=2.46e-05, batch=46/46, epoch=56/100, loss=0.1247]\n",
            "train_loss 0.1246565972333369, train_acc 0.7648, train_f1 0.7643837958181996,train_macro_auc 0.8448110687836528\n",
            "Validation:   5%|5         | 1/19 [00:04<01:25,  4.73s/it, epoch=56/100, batch=1/19, loss=0.1083]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=56/100, batch=19/19, loss=0.1218]\n",
            "\n",
            "Epoch 57 Summary:\n",
            "  Train Loss: 0.1247 | Acc: 0.7648 | F1: 0.7644\n",
            "  Val Loss: 0.1218 | Acc: 0.7863 | F1: 0.7886\n",
            "  Val F1 (macro): 0.7337 | Precision: 0.7916 | Recall: 0.7863 | auc macro 0.8148442025061335 | auc micro 0.8148442025061335 \n",
            "  Per-class AUC: {'normal': np.float64(0.8148442025061335), 'abnormal': np.float64(0.8148442025061335)}\n",
            "  Learning Rate: 2.38e-05\n",
            "EarlyStopping counter: 11/20\n",
            "\n",
            "Epoch 58/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:49<00:00,  2.39s/it, lr=2.38e-05, batch=46/46, epoch=57/100, loss=0.1210]\n",
            "train_loss 0.12101604093028151, train_acc 0.7682285714285715, train_f1 0.768272481348581,train_macro_auc 0.855901769652345\n",
            "Validation:   5%|5         | 1/19 [00:04<01:24,  4.68s/it, epoch=57/100, batch=1/19, loss=0.1075]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=57/100, batch=19/19, loss=0.1205]\n",
            "\n",
            "Epoch 58 Summary:\n",
            "  Train Loss: 0.1210 | Acc: 0.7682 | F1: 0.7683\n",
            "  Val Loss: 0.1205 | Acc: 0.7875 | F1: 0.7894\n",
            "  Val F1 (macro): 0.7341 | Precision: 0.7917 | Recall: 0.7875 | auc macro 0.8168337579287905 | auc micro 0.8168337579287905 \n",
            "  Per-class AUC: {'normal': np.float64(0.8168337579287905), 'abnormal': np.float64(0.8168337579287905)}\n",
            "  Learning Rate: 2.29e-05\n",
            "EarlyStopping counter: 12/20\n",
            "\n",
            "Epoch 59/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:53<00:00,  2.46s/it, lr=2.29e-05, batch=46/46, epoch=58/100, loss=0.1189]\n",
            "train_loss 0.11888219772473625, train_acc 0.7762285714285714, train_f1 0.7755460071417009,train_macro_auc 0.8595861118922321\n",
            "Validation:   5%|5         | 1/19 [00:04<01:24,  4.72s/it, epoch=58/100, batch=1/19, loss=0.1060]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=58/100, batch=19/19, loss=0.1182]\n",
            "\n",
            "Epoch 59 Summary:\n",
            "  Train Loss: 0.1189 | Acc: 0.7762 | F1: 0.7755\n",
            "  Val Loss: 0.1182 | Acc: 0.7963 | F1: 0.7947\n",
            "  Val F1 (macro): 0.7364 | Precision: 0.7934 | Recall: 0.7963 | auc macro 0.8167505654732474 | auc micro 0.8167505654732474 \n",
            "  Per-class AUC: {'normal': np.float64(0.8167505654732474), 'abnormal': np.float64(0.8167505654732474)}\n",
            "  Learning Rate: 2.21e-05\n",
            "✓ Best model saved: /content/drive/MyDrive/SPRSound/SPRSound-main/checkpoints/best_model.pth (metric: 0.7947)\n",
            "EarlyStopping counter: 13/20\n",
            "\n",
            "Epoch 60/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:57<00:00,  2.55s/it, lr=2.21e-05, batch=46/46, epoch=59/100, loss=0.1226]\n",
            "train_loss 0.12259728558685469, train_acc 0.7734857142857143, train_f1 0.7731915603473407,train_macro_auc 0.8515408006520581\n",
            "Validation:   5%|5         | 1/19 [00:04<01:25,  4.74s/it, epoch=59/100, batch=1/19, loss=0.1092]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=59/100, batch=19/19, loss=0.1287]\n",
            "\n",
            "Epoch 60 Summary:\n",
            "  Train Loss: 0.1226 | Acc: 0.7735 | F1: 0.7732\n",
            "  Val Loss: 0.1287 | Acc: 0.7586 | F1: 0.7677\n",
            "  Val F1 (macro): 0.7181 | Precision: 0.7876 | Recall: 0.7586 | auc macro 0.8200578579983268 | auc micro 0.8200578579983268 \n",
            "  Per-class AUC: {'normal': np.float64(0.8200578579983268), 'abnormal': np.float64(0.8200578579983268)}\n",
            "  Learning Rate: 2.12e-05\n",
            "EarlyStopping counter: 14/20\n",
            "\n",
            "Epoch 61/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:54<00:00,  2.50s/it, lr=2.12e-05, batch=46/46, epoch=60/100, loss=0.1212]\n",
            "train_loss 0.12117889296749364, train_acc 0.7753142857142857, train_f1 0.7749182828729205,train_macro_auc 0.854181370712551\n",
            "Validation:   5%|5         | 1/19 [00:04<01:26,  4.81s/it, epoch=60/100, batch=1/19, loss=0.1061]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=60/100, batch=19/19, loss=0.1198]\n",
            "\n",
            "Epoch 61 Summary:\n",
            "  Train Loss: 0.1212 | Acc: 0.7753 | F1: 0.7749\n",
            "  Val Loss: 0.1198 | Acc: 0.7869 | F1: 0.7888\n",
            "  Val F1 (macro): 0.7333 | Precision: 0.7910 | Recall: 0.7869 | auc macro 0.8202022675437977 | auc micro 0.8202022675437977 \n",
            "  Per-class AUC: {'normal': np.float64(0.8202022675437977), 'abnormal': np.float64(0.8202022675437977)}\n",
            "  Learning Rate: 2.04e-05\n",
            "EarlyStopping counter: 15/20\n",
            "\n",
            "Epoch 62/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:52<00:00,  2.46s/it, lr=2.04e-05, batch=46/46, epoch=61/100, loss=0.1196]\n",
            "train_loss 0.11960462934297064, train_acc 0.7830857142857143, train_f1 0.7830177668540758,train_macro_auc 0.8612355239466148\n",
            "Validation:   5%|5         | 1/19 [00:04<01:25,  4.75s/it, epoch=61/100, batch=1/19, loss=0.1103]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=61/100, batch=19/19, loss=0.1315]\n",
            "\n",
            "Epoch 62 Summary:\n",
            "  Train Loss: 0.1196 | Acc: 0.7831 | F1: 0.7830\n",
            "  Val Loss: 0.1315 | Acc: 0.7442 | F1: 0.7554\n",
            "  Val F1 (macro): 0.7068 | Precision: 0.7832 | Recall: 0.7442 | auc macro 0.8199212967977183 | auc micro 0.8199212967977183 \n",
            "  Per-class AUC: {'normal': np.float64(0.8199212967977183), 'abnormal': np.float64(0.8199212967977183)}\n",
            "  Learning Rate: 1.96e-05\n",
            "EarlyStopping counter: 16/20\n",
            "\n",
            "Epoch 63/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:52<00:00,  2.44s/it, lr=1.96e-05, batch=46/46, epoch=62/100, loss=0.1213]\n",
            "train_loss 0.12133543047568073, train_acc 0.7700571428571429, train_f1 0.7700813623108326,train_macro_auc 0.8555178937180529\n",
            "Validation:   5%|5         | 1/19 [00:04<01:26,  4.78s/it, epoch=62/100, batch=1/19, loss=0.1077]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=62/100, batch=19/19, loss=0.1212]\n",
            "\n",
            "Epoch 63 Summary:\n",
            "  Train Loss: 0.1213 | Acc: 0.7701 | F1: 0.7701\n",
            "  Val Loss: 0.1212 | Acc: 0.7858 | F1: 0.7886\n",
            "  Val F1 (macro): 0.7345 | Precision: 0.7925 | Recall: 0.7858 | auc macro 0.8185988506883782 | auc micro 0.8185988506883782 \n",
            "  Per-class AUC: {'normal': np.float64(0.8185988506883782), 'abnormal': np.float64(0.8185988506883782)}\n",
            "  Learning Rate: 1.87e-05\n",
            "EarlyStopping counter: 17/20\n",
            "\n",
            "Epoch 64/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:50<00:00,  2.40s/it, lr=1.87e-05, batch=46/46, epoch=63/100, loss=0.1218]\n",
            "train_loss 0.1218035637360552, train_acc 0.7661714285714286, train_f1 0.7659970833679455,train_macro_auc 0.8516330570332798\n",
            "Validation:   5%|5         | 1/19 [00:04<01:26,  4.82s/it, epoch=63/100, batch=1/19, loss=0.1096]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.93s/it, epoch=63/100, batch=19/19, loss=0.1278]\n",
            "\n",
            "Epoch 64 Summary:\n",
            "  Train Loss: 0.1218 | Acc: 0.7662 | F1: 0.7660\n",
            "  Val Loss: 0.1278 | Acc: 0.7647 | F1: 0.7734\n",
            "  Val F1 (macro): 0.7248 | Precision: 0.7927 | Recall: 0.7647 | auc macro 0.8207375246634236 | auc micro 0.8207375246634236 \n",
            "  Per-class AUC: {'normal': np.float64(0.8207375246634236), 'abnormal': np.float64(0.8207375246634236)}\n",
            "  Learning Rate: 1.79e-05\n",
            "EarlyStopping counter: 18/20\n",
            "\n",
            "Epoch 65/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:50<00:00,  2.41s/it, lr=1.79e-05, batch=46/46, epoch=64/100, loss=0.1204]\n",
            "train_loss 0.12036905810236931, train_acc 0.7698285714285714, train_f1 0.7693856425250144,train_macro_auc 0.8554321976969578\n",
            "Validation:   5%|5         | 1/19 [00:04<01:24,  4.70s/it, epoch=64/100, batch=1/19, loss=0.1058]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=64/100, batch=19/19, loss=0.1198]\n",
            "\n",
            "Epoch 65 Summary:\n",
            "  Train Loss: 0.1204 | Acc: 0.7698 | F1: 0.7694\n",
            "  Val Loss: 0.1198 | Acc: 0.7902 | F1: 0.7912\n",
            "  Val F1 (macro): 0.7351 | Precision: 0.7922 | Recall: 0.7902 | auc macro 0.8178760181265372 | auc micro 0.8178760181265372 \n",
            "  Per-class AUC: {'normal': np.float64(0.8178760181265372), 'abnormal': np.float64(0.8178760181265372)}\n",
            "  Learning Rate: 1.71e-05\n",
            "EarlyStopping counter: 19/20\n",
            "\n",
            "Epoch 66/100\n",
            "--------------------------------------------------------------------------------\n",
            "Training: 100%|##########| 46/46 [01:51<00:00,  2.42s/it, lr=1.71e-05, batch=46/46, epoch=65/100, loss=0.1229]\n",
            "train_loss 0.12288833069412605, train_acc 0.7682285714285715, train_f1 0.7678597334674052,train_macro_auc 0.8516681107283964\n",
            "Validation:   5%|5         | 1/19 [00:04<01:26,  4.78s/it, epoch=65/100, batch=1/19, loss=0.1081]"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/tmp/ipython-input-2947038974.py:119: DeprecationWarning: __array_wrap__ must accept context and return_scalar arguments (positionally) in the future. (Deprecated NumPy 2.0)\n",
            "  margins = probs - thresholds.reshape(1, -1)  # [N, C]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Validation: 100%|##########| 19/19 [00:36<00:00,  1.92s/it, epoch=65/100, batch=19/19, loss=0.1237]\n",
            "\n",
            "Epoch 66 Summary:\n",
            "  Train Loss: 0.1229 | Acc: 0.7682 | F1: 0.7679\n",
            "  Val Loss: 0.1237 | Acc: 0.7780 | F1: 0.7837\n",
            "  Val F1 (macro): 0.7324 | Precision: 0.7935 | Recall: 0.7780 | auc macro 0.8202838903303682 | auc micro 0.8202838903303682 \n",
            "  Per-class AUC: {'normal': np.float64(0.8202838903303682), 'abnormal': np.float64(0.8202838903303682)}\n",
            "  Learning Rate: 1.63e-05\n",
            "EarlyStopping counter: 20/20\n",
            "\n",
            "================================================================================\n",
            "Early stopping triggered at epoch 66\n",
            "Best validation F1: 0.7947\n",
            "================================================================================\n",
            "\n",
            "\n",
            "================================================================================\n",
            "TRAINING COMPLETED\n",
            "Best validation F1: 0.7947\n",
            "================================================================================\n",
            "\n"
          ]
        }
      ],
      "source": [
        "#################### Trainer ########################\n",
        "\n",
        "class RespiratoryTrainer:\n",
        "    def __init__(self, configs={}):\n",
        "        self.configs = configs\n",
        "        os.makedirs(configs[\"logdir\"], exist_ok=True)\n",
        "\n",
        "        # Setup logging\n",
        "        log_path_train = os.path.join(configs[\"logdir\"], \"training_log.txt\")\n",
        "        log_path_val = os.path.join(configs[\"logdir\"], \"val_log.txt\")\n",
        "        log_path_test = os.path.join(configs[\"logdir\"], \"test_log.txt\")\n",
        "\n",
        "        self.traintee = TeeFile(sys.stdout, log_path_train)\n",
        "        self.valtee = TeeFile(sys.stdout, log_path_val)\n",
        "        self.testtee = TeeFile(sys.stdout, log_path_test)\n",
        "\n",
        "        # Create directories\n",
        "        for dir in self.configs[\"dirsToMake\"]:\n",
        "            os.makedirs(dir, exist_ok=True)\n",
        "\n",
        "        # Initialize model\n",
        "        self.model = AdaptiveRespiratoryModel(\n",
        "            num_classes=configs[\"num_classes\"],\n",
        "            dropout=configs[\"dropout\"],\n",
        "            use_lora=configs.get(\"use_lora\", True),\n",
        "            lora_r=configs.get(\"lora_r\", 8),\n",
        "            lora_alpha=configs.get(\"lora_alpha\", 16),\n",
        "            lora_dropout=configs.get(\"lora_dropout\", 0.05),\n",
        "            lora_last_n_blocks=configs.get(\"lora_last_n_blocks\", 2),\n",
        "        ).to(self.configs[\"device\"])\n",
        "\n",
        "        # Create dataloaders\n",
        "        print(\"Creating dataloaders...\")\n",
        "        train_loader, val_loader, test_loader, class_weights, train_dataset = create_dataloaders_from_csv(\n",
        "            csv_dir=configs[\"csv_dir\"],\n",
        "            batch_size=configs[\"batch_size\"],\n",
        "            num_workers=configs.get(\"num_workers\", 2)\n",
        "        )\n",
        "\n",
        "        self.trainloader = train_loader\n",
        "        self.valloader = val_loader\n",
        "        self.testloader = test_loader\n",
        "        self.train_dataset = train_dataset\n",
        "        self.class_weights = class_weights.to(configs[\"device\"])\n",
        "        self.class_names = [train_dataset.idx_to_class[i] for i in range(configs[\"num_classes\"])]\n",
        "\n",
        "        # Training history\n",
        "        # load or create history\n",
        "        history_path = os.path.join(self.configs[\"logdir\"], \"history.json\")\n",
        "        if os.path.exists(history_path):\n",
        "            with open(history_path, \"r\") as f:\n",
        "                self.history = json.load(f)\n",
        "                if \"thresholds\" not in self.history:\n",
        "                    self.history[\"thresholds\"] = []\n",
        "        else:\n",
        "            self.history = {\n",
        "                \"train_loss\": [],\n",
        "                \"train_acc\": [],\n",
        "                \"train_f1\": [],\n",
        "                \"val_loss\": [],\n",
        "                \"val_acc\": [],\n",
        "                \"val_f1\": [],\n",
        "                \"val_auc_macro\":[],\n",
        "                \"val_auc_micro\":[],\n",
        "                \"val_per_class_auc\":[],\n",
        "                \"lr\": [],\n",
        "                \"thresholds\":[]\n",
        "            }\n",
        "\n",
        "        # Loss function with class weights\n",
        "        alpha = torch.clamp(self.class_weights, max=5.0)\n",
        "        self.criterion = FocalLoss(gamma=2.0, alpha=None)\n",
        "\n",
        "        # Optimizer with different learning rates for LoRA and head\n",
        "        lora_params, head_params = [], []\n",
        "        for n, p in self.model.named_parameters():\n",
        "            if not p.requires_grad:\n",
        "                continue\n",
        "            if \"lora_A\" in n or \"lora_B\" in n:\n",
        "                lora_params.append(p)\n",
        "            else:\n",
        "                head_params.append(p)\n",
        "\n",
        "        self.optimizer = torch.optim.AdamW([\n",
        "            {\"params\": head_params, \"lr\": self.configs[\"lr\"], \"weight_decay\": self.configs[\"weight_decay\"]},\n",
        "            {\"params\": lora_params, \"lr\": 0.1 * self.configs[\"lr\"], \"weight_decay\": self.configs[\"weight_decay\"]},\n",
        "        ])\n",
        "\n",
        "        # Learning rate schedulers\n",
        "\n",
        "        self.scheduler1 = torch.optim.lr_scheduler.LinearLR(            self.optimizer,\n",
        "            start_factor=0.1,\n",
        "            end_factor=1.0,\n",
        "            total_iters=configs[\"warmup\"]\n",
        "        )\n",
        "        self.scheduler2 = torch.optim.lr_scheduler.CosineAnnealingLR(\n",
        "            self.optimizer,eta_min=1e-6,\n",
        "            T_max=configs[\"num_epochs\"] - configs[\"warmup\"]\n",
        "        )\n",
        "        self.scheduler = torch.optim.lr_scheduler.SequentialLR(\n",
        "            self.optimizer,\n",
        "            schedulers=[self.scheduler1, self.scheduler2],\n",
        "            milestones=[configs[\"warmup\"]]\n",
        "        )\n",
        "        # Mixed precision training\n",
        "        self.scaler = torch.amp.GradScaler('cuda') if configs.get(\"use_amp\", True) else None\n",
        "\n",
        "        # Early stopping\n",
        "        self.early_stopping = EarlyStopping(\n",
        "            patience=configs.get(\"early_stopping_patience\", 10),\n",
        "            min_delta=configs.get(\"early_stopping_min_delta\", 0.001)\n",
        "        )\n",
        "\n",
        "        self.current_epoch = 0\n",
        "        self.best_val_f1 = 0.0\n",
        "        self.best_thresholds=[0.5]*configs[\"num_classes\"]\n",
        "\n",
        "        # Resume from checkpoint if exists\n",
        "        if os.path.exists(self.configs[\"resume\"]):\n",
        "            self.load_checkpoint(self.configs[\"resume\"])\n",
        "\n",
        "\n",
        "\n",
        "\n",
        "    def load_checkpoint(self, checkpoint_path):\n",
        "        \"\"\"Load model checkpoint\"\"\"\n",
        "        print(f\"Loading checkpoint from {checkpoint_path}\")\n",
        "        checkpoint = torch.load(checkpoint_path, map_location=self.configs[\"device\"],weights_only =False)\n",
        "\n",
        "        self.model.load_state_dict(checkpoint[\"model\"], strict=False)\n",
        "\n",
        "        if \"optimizer\" in checkpoint:\n",
        "            self.optimizer.load_state_dict(checkpoint[\"optimizer\"])\n",
        "        if \"scheduler\" in checkpoint:\n",
        "            self.scheduler.load_state_dict(checkpoint[\"scheduler\"])\n",
        "        if \"epoch\" in checkpoint:\n",
        "            self.current_epoch = checkpoint[\"epoch\"] + 1\n",
        "        if \"best_val_f1\" in checkpoint:\n",
        "            self.best_val_f1 = checkpoint[\"best_val_f1\"]\n",
        "        if \"thresholds\" in checkpoint:\n",
        "            self.best_thresholds = checkpoint[\"thresholds\"]\n",
        "\n",
        "\n",
        "        print(f\"Resumed from epoch {self.current_epoch}, best val f1: {self.best_val_f1:.4f}\")\n",
        "\n",
        "    def save_checkpoint(self, epoch, val_metric,thresholds, is_best=False):\n",
        "        \"\"\"Save model checkpoint\"\"\"\n",
        "        checkpoint = {\n",
        "            \"model\": self.model.state_dict(),\n",
        "            \"optimizer\": self.optimizer.state_dict(),\n",
        "            \"scheduler\": self.scheduler.state_dict(),\n",
        "            \"epoch\": epoch,\n",
        "            \"best_val_f1\": self.best_val_f1,\n",
        "            \"config\": self.configs,\n",
        "            \"thresholds\":thresholds\n",
        "        }\n",
        "\n",
        "        # Save regular checkpoint\n",
        "        checkpoint_path = os.path.join(\n",
        "            self.configs[\"logdir\"].replace(\"logs\", \"checkpoints\"),\n",
        "            f\"checkpoint_epoch_{epoch}.pth\"\n",
        "        )\n",
        "        torch.save(checkpoint, checkpoint_path)\n",
        "\n",
        "        # Save best checkpoint\n",
        "        if is_best:\n",
        "            best_path = self.configs[\"resume\"]\n",
        "            torch.save(checkpoint, best_path)\n",
        "            print(f\"✓ Best model saved: {best_path} (metric: {val_metric:.4f})\")\n",
        "\n",
        "    def train_epoch(self, epoch, looper):\n",
        "        \"\"\"Train for one epoch\"\"\"\n",
        "        self.model.train()\n",
        "        running_loss = 0.0\n",
        "        all_preds = []\n",
        "        all_labels = []\n",
        "        all_probs=[]\n",
        "        total_batches = len(self.trainloader)\n",
        "        accumulation = self.configs.get(\"accumulation\", 1)\n",
        "\n",
        "        self.optimizer.zero_grad(set_to_none=True)\n",
        "\n",
        "        for batch_idx, data in looper:\n",
        "            features = data['features'].to(self.configs[\"device\"], non_blocking=True)   # [B,T,1,192,128]\n",
        "            lengths  = data['lengths'].to(self.configs[\"device\"], non_blocking=True)   # [B]\n",
        "            labels = data['label'].to(self.configs[\"device\"], non_blocking=True)\n",
        "\n",
        "            # Mixed precision forward pass\n",
        "            if self.scaler is not None:\n",
        "                with torch.amp.autocast('cuda'):\n",
        "                    logits,attn = self.model(features, lengths)\n",
        "                    loss = self.criterion(logits, labels)\n",
        "\n",
        "                # Backward with gradient accumulation\n",
        "                loss_scaled = loss / accumulation\n",
        "                self.scaler.scale(loss_scaled).backward()\n",
        "\n",
        "                if (batch_idx + 1) % accumulation == 0 or batch_idx == total_batches - 1:\n",
        "                    # Gradient clipping\n",
        "                    self.scaler.unscale_(self.optimizer)\n",
        "                    torch.nn.utils.clip_grad_norm_(self.model.parameters(), max_norm=1.0)\n",
        "\n",
        "                    self.scaler.step(self.optimizer)\n",
        "                    self.scaler.update()\n",
        "                    self.optimizer.zero_grad(set_to_none=True)\n",
        "            else:\n",
        "                logits,attn = self.model(features,lengths)\n",
        "                loss = self.criterion(logits, labels)\n",
        "\n",
        "                loss_back = loss / accumulation\n",
        "                loss_back.backward()\n",
        "\n",
        "                if (batch_idx + 1) % accumulation == 0 or batch_idx == total_batches - 1:\n",
        "                    torch.nn.utils.clip_grad_norm_(self.model.parameters(), max_norm=1.0)\n",
        "                    self.optimizer.step()\n",
        "                    self.optimizer.zero_grad(set_to_none=True)\n",
        "\n",
        "            running_loss += loss.item()\n",
        "\n",
        "            # Collect predictions\n",
        "            probs = torch.softmax(logits.float(), dim=1)\n",
        "            preds = torch.argmax(probs, dim=1)\n",
        "\n",
        "            all_preds.extend(preds.detach().cpu().numpy())\n",
        "            all_labels.extend(labels.detach().cpu().numpy())\n",
        "            all_probs.extend(probs.detach().cpu().numpy())\n",
        "\n",
        "            # Update progress bar\n",
        "            current_loss = running_loss / (batch_idx + 1)\n",
        "            current_lr = self.optimizer.param_groups[0][\"lr\"]\n",
        "            looper.set_postfix({\n",
        "                \"lr\": f\"{current_lr:.2e}\",\n",
        "                \"batch\": f\"{batch_idx + 1}/{total_batches}\",\n",
        "                \"epoch\": f\"{epoch}/{self.configs['num_epochs']}\",\n",
        "                \"loss\": f\"{current_loss:.4f}\"\n",
        "            })\n",
        "        thresholds=find_best_thresholds_one_vs_rest(\n",
        "            probs=np.array(all_probs),\n",
        "            y_true=np.array(all_labels),\n",
        "            num_classes=self.configs[\"num_classes\"],\n",
        "            grid_size=101,\n",
        "            min_thr=0.05,\n",
        "            max_thr=0.95\n",
        "        )\n",
        "        # Calculate metrics\n",
        "        avg_loss = running_loss / total_batches\n",
        "        accuracy = accuracy_score(all_labels, all_preds)\n",
        "        f1 = f1_score(all_labels, all_preds, average='weighted')\n",
        "        all_probs = np.array(all_probs)\n",
        "        auc_score = self.calculate_auc_scores(all_labels, all_probs, average='macro')\n",
        "\n",
        "        return avg_loss, accuracy, f1,auc_score,thresholds.tolist()\n",
        "\n",
        "    def validate(self, epoch, looper):\n",
        "        \"\"\"Validate the model\"\"\"\n",
        "        self.model.eval()\n",
        "        running_loss = 0.0\n",
        "        all_preds = []\n",
        "        all_labels = []\n",
        "        all_probs = []\n",
        "\n",
        "        with torch.no_grad():\n",
        "            for batch_idx, data in looper:\n",
        "                features = data['features'].to(self.configs[\"device\"], non_blocking=True)\n",
        "                lengths  = data['lengths'].to(self.configs[\"device\"], non_blocking=True)   # [B]\n",
        "                labels = data['label'].to(self.configs[\"device\"], non_blocking=True)\n",
        "\n",
        "                if self.scaler is not None:\n",
        "                    with torch.amp.autocast('cuda'):\n",
        "                        logits,attn = self.model(features,lengths)\n",
        "                        loss = self.criterion(logits, labels)\n",
        "                else:\n",
        "                    logits,attn = self.model(features,lengths)\n",
        "                    loss = self.criterion(logits, labels)\n",
        "\n",
        "                running_loss += loss.item()\n",
        "\n",
        "                # Get predictions and probabilities\n",
        "                probs = torch.softmax(logits.float(), dim=1)\n",
        "                #preds = torch.argmax(probs, dim=1)\n",
        "                preds = predict_with_thresholds(\n",
        "                    probs.cpu(),\n",
        "                    np.array(self.best_thresholds, dtype=np.float32)\n",
        "                )\n",
        "                all_preds.extend(preds.detach().cpu().numpy())\n",
        "                all_labels.extend(labels.detach().cpu().numpy())\n",
        "                all_probs.extend(probs.detach().cpu().numpy())\n",
        "\n",
        "                # Update progress bar\n",
        "                current_loss = running_loss / (batch_idx + 1)\n",
        "                looper.set_postfix({\n",
        "                    \"epoch\": f\"{epoch}/{self.configs['num_epochs']}\",\n",
        "                    \"batch\": f\"{batch_idx + 1}/{len(self.valloader)}\",\n",
        "                    \"loss\": f\"{current_loss:.4f}\"\n",
        "                })\n",
        "\n",
        "\n",
        "\n",
        "        avg_loss = running_loss / len(self.valloader)\n",
        "        accuracy = accuracy_score(all_labels, all_preds)\n",
        "        f1_weighted = f1_score(all_labels, all_preds, average='weighted')\n",
        "        f1_macro = f1_score(all_labels, all_preds, average='macro')\n",
        "        precision = precision_score(all_labels, all_preds, average='weighted', zero_division=0)\n",
        "        recall = recall_score(all_labels, all_preds, average='weighted', zero_division=0)\n",
        "        all_probs = np.array(all_probs)\n",
        "        auc_macro = self.calculate_auc_scores(all_labels, all_probs, average='macro')\n",
        "        auc_micro = self.calculate_auc_scores(all_labels, all_probs, average='micro')\n",
        "        per_class_auc = self.calculate_per_class_auc(all_labels, all_probs)\n",
        "\n",
        "        metrics = {\n",
        "            'loss': avg_loss,\n",
        "            'accuracy': accuracy,\n",
        "            'f1_weighted': f1_weighted,\n",
        "            'f1_macro': f1_macro,\n",
        "            'precision': precision,\n",
        "            'recall': recall,\n",
        "            'preds': all_preds,\n",
        "            'labels': all_labels,\n",
        "            'probs': all_probs,\n",
        "            'val_auc_macro': auc_macro,\n",
        "            'val_auc_micro': auc_micro,\n",
        "            'per_class_auc': per_class_auc\n",
        "        }\n",
        "\n",
        "        return metrics\n",
        "\n",
        "    def train(self):\n",
        "        \"\"\"Main training loop\"\"\"\n",
        "        print(f\"\\n{'='*80}\")\n",
        "        print(\"STARTING TRAINING\")\n",
        "        print(f\"{'='*80}\\n\")\n",
        "\n",
        "        for epoch in range(self.current_epoch, self.configs[\"num_epochs\"]):\n",
        "            print(f\"\\nEpoch {epoch + 1}/{self.configs['num_epochs']}\")\n",
        "            print(\"-\" * 80)\n",
        "\n",
        "            # Train\n",
        "            train_looper = tqdm(\n",
        "                enumerate(self.trainloader),\n",
        "                total=len(self.trainloader),\n",
        "                desc=\"Training\",\n",
        "                file=self.traintee\n",
        "            )\n",
        "            train_loss, train_acc, train_f1,train_macro_auc,thresholds = self.train_epoch(epoch, train_looper)\n",
        "            print(f\"train_loss {train_loss}, train_acc {train_acc}, train_f1 {train_f1},train_macro_auc {train_macro_auc}\")\n",
        "\n",
        "            # Validate\n",
        "            val_looper = tqdm(\n",
        "                enumerate(self.valloader),\n",
        "                total=len(self.valloader),\n",
        "                desc=\"Validation\",\n",
        "                file=self.valtee\n",
        "            )\n",
        "            val_metrics = self.validate(epoch, val_looper)\n",
        "\n",
        "            # Update learning rate\n",
        "            self.scheduler.step()\n",
        "            current_lr = self.optimizer.param_groups[0][\"lr\"]\n",
        "\n",
        "            # Update history\n",
        "            self.history[\"train_loss\"].append(float(train_loss))\n",
        "            self.history[\"train_acc\"].append(float(train_acc))\n",
        "            self.history[\"train_f1\"].append(float(train_f1))\n",
        "            self.history[\"val_loss\"].append(float(val_metrics['loss']))\n",
        "            self.history[\"val_acc\"].append(float(val_metrics['accuracy']))\n",
        "            self.history[\"val_f1\"].append(float(val_metrics['f1_weighted']))\n",
        "            self.history[\"lr\"].append(float(current_lr))\n",
        "            self.history[\"val_auc_macro\"].append(float(val_metrics['val_auc_macro']))\n",
        "            self.history[\"val_auc_micro\"].append(float(val_metrics['val_auc_micro']))\n",
        "            self.history[\"val_per_class_auc\"].append(val_metrics['per_class_auc'])\n",
        "            self.history[\"thresholds\"].append(thresholds)\n",
        "\n",
        "            # Print metrics\n",
        "            print(f\"\\nEpoch {epoch + 1} Summary:\")\n",
        "            print(f\"  Train Loss: {train_loss:.4f} | Acc: {train_acc:.4f} | F1: {train_f1:.4f}\")\n",
        "            print(f\"  Val Loss: {val_metrics['loss']:.4f} | Acc: {val_metrics['accuracy']:.4f} | F1: {val_metrics['f1_weighted']:.4f}\")\n",
        "            print(f\"  Val F1 (macro): {val_metrics['f1_macro']:.4f} | Precision: {val_metrics['precision']:.4f} | Recall: {val_metrics['recall']:.4f} | auc macro {val_metrics['val_auc_macro']} | auc micro {val_metrics['val_auc_micro']} \")\n",
        "            print(f\"  Per-class AUC: {val_metrics['per_class_auc']}\")\n",
        "            print(f\"  Learning Rate: {current_lr:.2e}\")\n",
        "\n",
        "            # Save checkpoint if best\n",
        "            is_best = val_metrics['f1_weighted'] > self.best_val_f1\n",
        "            if is_best:\n",
        "                self.best_val_f1 = val_metrics['f1_weighted']\n",
        "                self.best_thresholds = thresholds\n",
        "\n",
        "\n",
        "            self.save_checkpoint(epoch, val_metrics['f1_weighted'],self.best_thresholds , is_best=is_best)\n",
        "\n",
        "            # Save history\n",
        "            history_path = os.path.join(self.configs[\"logdir\"], \"history.json\")\n",
        "            with open(history_path, \"w\") as f:\n",
        "                json.dump(self.history, f, indent=2)\n",
        "\n",
        "            # Plot metrics every N epochs\n",
        "            if (epoch + 1) % 5 == 0:\n",
        "                self.plot_training_metrics(epoch + 1)\n",
        "                self.plot_confusion_matrix(\n",
        "                    val_metrics['labels'],\n",
        "                    val_metrics['preds'],\n",
        "                    epoch + 1\n",
        "                )\n",
        "\n",
        "            # Early stopping check\n",
        "            if self.early_stopping(val_metrics[\"f1_weighted\"]):\n",
        "                print(f\"\\n{'='*80}\")\n",
        "                print(f\"Early stopping triggered at epoch {epoch + 1}\")\n",
        "                print(f\"Best validation F1: {self.best_val_f1:.4f}\")\n",
        "                print(f\"{'='*80}\\n\")\n",
        "                break\n",
        "\n",
        "        print(f\"\\n{'='*80}\")\n",
        "        print(\"TRAINING COMPLETED\")\n",
        "        print(f\"Best validation F1: {self.best_val_f1:.4f}\")\n",
        "        print(f\"{'='*80}\\n\")\n",
        "\n",
        "    def calculate_auc_scores(self, labels, probs, average='macro'):\n",
        "        \"\"\"\n",
        "        Calculate AUC scores for multi-class classification.\n",
        "        Handles missing classes gracefully.\n",
        "\n",
        "        Args:\n",
        "            labels: True labels (1D array)\n",
        "            probs: Predicted probabilities (2D array: samples x classes)\n",
        "            average: 'macro', 'micro', or 'weighted'\n",
        "\n",
        "        Returns:\n",
        "            AUC score(s)\n",
        "        \"\"\"\n",
        "        try:\n",
        "            # For binary case\n",
        "            if len(self.class_names) == 2:\n",
        "                auc_score = roc_auc_score(labels, probs[:, 1])\n",
        "                return auc_score\n",
        "\n",
        "            # Check if we have at least 2 classes\n",
        "            present_classes = np.unique(labels)\n",
        "            if len(present_classes) < 2:\n",
        "                print(f\"Warning: Only {len(present_classes)} class present. Need at least 2.\")\n",
        "                return 0.0\n",
        "\n",
        "            # Binarize labels for one-vs-rest\n",
        "            labels_bin = label_binarize(labels, classes=range(len(self.class_names)))\n",
        "\n",
        "            # Calculate per-class AUC for present classes only\n",
        "            auc_scores = []\n",
        "            class_counts = []\n",
        "\n",
        "            for i in present_classes:\n",
        "                try:\n",
        "                    # Check if this class has both positive and negative samples\n",
        "                    if labels_bin[:, i].sum() > 0 and labels_bin[:, i].sum() < len(labels_bin):\n",
        "                        class_auc = roc_auc_score(labels_bin[:, i], probs[:, i])\n",
        "                        auc_scores.append(class_auc)\n",
        "                        class_counts.append((labels == i).sum())\n",
        "                except Exception as e:\n",
        "                    print(f\"Warning: Could not calculate AUC for class {i} ({self.class_names[i]}): {e}\")\n",
        "                    continue\n",
        "\n",
        "            if not auc_scores:\n",
        "                print(\"Warning: Could not calculate AUC for any class\")\n",
        "                return 0.0\n",
        "\n",
        "            # Apply averaging\n",
        "            if average == 'macro':\n",
        "                # Unweighted mean of per-class AUCs\n",
        "                return np.mean(auc_scores)\n",
        "            elif average == 'weighted':\n",
        "                # Weighted by class frequency\n",
        "                weights = np.array(class_counts) / sum(class_counts)\n",
        "                return np.average(auc_scores, weights=weights)\n",
        "            elif average == 'micro':\n",
        "                # Micro-averaging: aggregate all classes then calculate AUC\n",
        "                # Flatten the binary labels and probabilities for all present classes\n",
        "                all_labels = []\n",
        "                all_probs = []\n",
        "                for i in present_classes:\n",
        "                    all_labels.extend(labels_bin[:, i])\n",
        "                    all_probs.extend(probs[:, i])\n",
        "                return roc_auc_score(all_labels, all_probs)\n",
        "            else:\n",
        "                return np.mean(auc_scores)\n",
        "\n",
        "        except Exception as e:\n",
        "            print(f\"Warning: Could not calculate AUC - {e}\")\n",
        "            import traceback\n",
        "            traceback.print_exc()\n",
        "            return 0.0\n",
        "\n",
        "    def calculate_per_class_auc(self, labels, probs):\n",
        "        \"\"\"\n",
        "        Calculate AUC for each class separately.\n",
        "\n",
        "        Returns:\n",
        "            Dictionary mapping class names to AUC scores\n",
        "        \"\"\"\n",
        "        per_class_auc = {}\n",
        "\n",
        "        # Binarize labels for one-vs-rest\n",
        "        labels_bin = label_binarize(labels, classes=range(len(self.class_names)))\n",
        "\n",
        "        for i, class_name in enumerate(self.class_names):\n",
        "            try:\n",
        "                if labels_bin.shape[1] == 1:  # Binary case\n",
        "                    auc_score = roc_auc_score(labels, probs[:, 1])\n",
        "                else:\n",
        "                    auc_score = roc_auc_score(labels_bin[:, i], probs[:, i])\n",
        "                per_class_auc[class_name] = auc_score\n",
        "            except Exception as e:\n",
        "                print(f\"Warning: Could not calculate AUC for {class_name} - {e}\")\n",
        "                per_class_auc[class_name] = 0.0\n",
        "\n",
        "        return per_class_auc\n",
        "\n",
        "    def plot_training_metrics(self, epoch):\n",
        "        \"\"\"Plot training metrics\"\"\"\n",
        "        save_dir = os.path.join(self.configs[\"logdir\"], \"figures\", f\"epoch_{epoch}\")\n",
        "        os.makedirs(save_dir, exist_ok=True)\n",
        "\n",
        "        epochs = list(range(1, len(self.history[\"train_loss\"]) + 1))\n",
        "\n",
        "        # Plot 1: Loss curves\n",
        "        plt.figure(figsize=(10, 6))\n",
        "        plt.plot(epochs, self.history[\"train_loss\"], label=\"Train Loss\", linewidth=2.5, color='blue')\n",
        "        plt.plot(epochs, self.history[\"val_loss\"], label=\"Val Loss\", linewidth=2.5, color='orange')\n",
        "        plt.xlabel(\"Epoch\", fontsize=12)\n",
        "        plt.ylabel(\"Loss\", fontsize=12)\n",
        "        plt.title(\"Training & Validation Loss\", fontsize=14, fontweight='bold')\n",
        "        plt.legend(fontsize=11)\n",
        "        plt.grid(True, linestyle='--', alpha=0.6)\n",
        "        plt.tight_layout()\n",
        "        plt.savefig(os.path.join(save_dir, \"loss_curves.png\"), dpi=150)\n",
        "        plt.close()\n",
        "\n",
        "        # Plot 2: Accuracy curves\n",
        "        plt.figure(figsize=(10, 6))\n",
        "        plt.plot(epochs, self.history[\"train_acc\"], label=\"Train Accuracy\", linewidth=2.5, color='blue')\n",
        "        plt.plot(epochs, self.history[\"val_acc\"], label=\"Val Accuracy\", linewidth=2.5, color='orange')\n",
        "        plt.xlabel(\"Epoch\", fontsize=12)\n",
        "        plt.ylabel(\"Accuracy\", fontsize=12)\n",
        "        plt.title(\"Training & Validation Accuracy\", fontsize=14, fontweight='bold')\n",
        "        plt.legend(fontsize=11)\n",
        "        plt.grid(True, linestyle='--', alpha=0.6)\n",
        "        plt.tight_layout()\n",
        "        plt.savefig(os.path.join(save_dir, \"accuracy_curves.png\"), dpi=150)\n",
        "        plt.close()\n",
        "\n",
        "        # Plot 3: F1 Score curves\n",
        "        plt.figure(figsize=(10, 6))\n",
        "        plt.plot(epochs, self.history[\"train_f1\"], label=\"Train F1\", linewidth=2.5, color='blue')\n",
        "        plt.plot(epochs, self.history[\"val_f1\"], label=\"Val F1\", linewidth=2.5, color='orange')\n",
        "        plt.xlabel(\"Epoch\", fontsize=12)\n",
        "        plt.ylabel(\"F1 Score\", fontsize=12)\n",
        "        plt.title(\"Training & Validation F1 Score\", fontsize=14, fontweight='bold')\n",
        "        plt.legend(fontsize=11)\n",
        "        plt.grid(True, linestyle='--', alpha=0.6)\n",
        "        plt.tight_layout()\n",
        "        plt.savefig(os.path.join(save_dir, \"f1_curves.png\"), dpi=150)\n",
        "        plt.close()\n",
        "\n",
        "        # Plot 4: Learning rate\n",
        "        plt.figure(figsize=(10, 6))\n",
        "        plt.plot(epochs, self.history[\"lr\"], linewidth=2.5, color='green')\n",
        "        plt.xlabel(\"Epoch\", fontsize=12)\n",
        "        plt.ylabel(\"Learning Rate\", fontsize=12)\n",
        "        plt.title(\"Learning Rate Schedule\", fontsize=14, fontweight='bold')\n",
        "        plt.yscale('log')\n",
        "        plt.grid(True, linestyle='--', alpha=0.6)\n",
        "        plt.tight_layout()\n",
        "        plt.savefig(os.path.join(save_dir, \"learning_rate.png\"), dpi=150)\n",
        "        plt.close()\n",
        "\n",
        "    def plot_confusion_matrix(self, labels, preds, epoch):\n",
        "        \"\"\"Plot confusion matrix\"\"\"\n",
        "        save_dir = os.path.join(self.configs[\"logdir\"], \"figures\", f\"epoch_{epoch}\")\n",
        "        os.makedirs(save_dir, exist_ok=True)\n",
        "\n",
        "        # Compute confusion matrix\n",
        "        cm = confusion_matrix(labels, preds)\n",
        "\n",
        "        # Normalize\n",
        "        cm_normalized = cm.astype('float') / cm.sum(axis=1)[:, np.newaxis]\n",
        "\n",
        "        # Plot\n",
        "        plt.figure(figsize=(12, 10))\n",
        "        sns.heatmap(\n",
        "            cm_normalized,\n",
        "            annot=True,\n",
        "            fmt='.2f',\n",
        "            cmap='Blues',\n",
        "            xticklabels=self.class_names,\n",
        "            yticklabels=self.class_names,\n",
        "            cbar_kws={'label': 'Normalized Count'}\n",
        "        )\n",
        "        plt.xlabel(\"Predicted\", fontsize=12)\n",
        "        plt.ylabel(\"True\", fontsize=12)\n",
        "        plt.title(\"Confusion Matrix (Normalized)\", fontsize=14, fontweight='bold')\n",
        "        plt.xticks(rotation=45, ha='right')\n",
        "        plt.yticks(rotation=0)\n",
        "        plt.tight_layout()\n",
        "        plt.savefig(os.path.join(save_dir, \"confusion_matrix.png\"), dpi=150)\n",
        "        plt.close()\n",
        "\n",
        "        # Save classification report\n",
        "        report = classification_report(\n",
        "            labels,\n",
        "            preds,\n",
        "            target_names=self.class_names,\n",
        "            digits=4\n",
        "        )\n",
        "        report_path = os.path.join(save_dir, \"classification_report.txt\")\n",
        "        with open(report_path, 'w') as f:\n",
        "            f.write(report)\n",
        "\n",
        "    def test(self, model_path: Optional[str] = None):\n",
        "        \"\"\"Test the model\"\"\"\n",
        "        if model_path is None:\n",
        "            model_path = self.configs[\"resume\"]\n",
        "\n",
        "        print(f\"\\n{'='*80}\")\n",
        "        print(\"TESTING MODEL\")\n",
        "        print(f\"{'='*80}\\n\")\n",
        "        print(f\"Loading model from: {model_path}\")\n",
        "\n",
        "        checkpoint = torch.load(model_path, map_location=self.configs[\"device\"],weights_only =False)\n",
        "        self.model.load_state_dict(checkpoint[\"model\"], strict=False)\n",
        "        self.model.eval()\n",
        "\n",
        "        all_preds = []\n",
        "        all_labels = []\n",
        "        all_probs = []\n",
        "        all_filenames = []\n",
        "\n",
        "        with torch.no_grad():\n",
        "            for data in tqdm(self.testloader, desc=\"Testing\", file=self.testtee):\n",
        "                features = data['features'].to(self.configs[\"device\"], non_blocking=True)\n",
        "                lengths  = data['lengths'].to(self.configs[\"device\"], non_blocking=True)   # [B]\n",
        "                labels = data['label'].to(self.configs[\"device\"], non_blocking=True)\n",
        "\n",
        "                if self.scaler is not None:\n",
        "                    with torch.amp.autocast('cuda'):\n",
        "                        logits,_ = self.model(features,lengths)\n",
        "                else:\n",
        "                    logits,_ = self.model(features,lengths)\n",
        "\n",
        "                probs = torch.softmax(logits.float(), dim=1)\n",
        "                #preds = torch.argmax(probs, dim=1)\n",
        "                preds = predict_with_thresholds(\n",
        "                    probs.cpu(),\n",
        "                    np.array(self.best_thresholds, dtype=np.float32)\n",
        "                )\n",
        "\n",
        "\n",
        "                all_preds.extend(preds.detach().cpu().numpy())\n",
        "                all_labels.extend(labels.detach().cpu().numpy())\n",
        "                all_probs.extend(probs.detach().cpu().numpy())\n",
        "                all_filenames.extend(data['filename'])\n",
        "\n",
        "        # Calculate metrics\n",
        "        accuracy = accuracy_score(all_labels, all_preds)\n",
        "        f1_weighted = f1_score(all_labels, all_preds, average='weighted')\n",
        "        f1_macro = f1_score(all_labels, all_preds, average='macro')\n",
        "        precision = precision_score(all_labels, all_preds, average='weighted', zero_division=0)\n",
        "        recall = recall_score(all_labels, all_preds, average='weighted', zero_division=0)\n",
        "        all_probs = np.array(all_probs)\n",
        "        auc_macro = self.calculate_auc_scores(all_labels, all_probs, average='macro')\n",
        "        auc_micro = self.calculate_auc_scores(all_labels, all_probs, average='micro')\n",
        "        per_class_auc = self.calculate_per_class_auc(all_labels, all_probs)\n",
        "\n",
        "        print(f\"\\n{'='*80}\")\n",
        "        print(\"TEST RESULTS\")\n",
        "        print(f\"{'='*80}\")\n",
        "        print(f\"Accuracy: {accuracy:.4f}\")\n",
        "        print(f\"F1 (weighted): {f1_weighted:.4f}\")\n",
        "        print(f\"F1 (macro): {f1_macro:.4f}\")\n",
        "        print(f\"Precision: {precision:.4f}\")\n",
        "        print(f\"Recall: {recall:.4f}\")\n",
        "        print(f\"AUC (macro): {auc_macro:.4f}\")\n",
        "        print(f\"AUC (micro): {auc_micro:.4f}\")\n",
        "        print(f\"Per-class AUC: {per_class_auc}\")\n",
        "        print(f\"{'='*80}\\n\")\n",
        "\n",
        "        # Detailed classification report\n",
        "        report = classification_report(\n",
        "            all_labels,\n",
        "            all_preds,\n",
        "            target_names=self.class_names,\n",
        "            digits=4\n",
        "        )\n",
        "        print(\"\\nClassification Report:\")\n",
        "        print(report)\n",
        "\n",
        "        # Save results\n",
        "        test_results_dir = os.path.join(self.configs[\"logdir\"], \"test_results\")\n",
        "        os.makedirs(test_results_dir, exist_ok=True)\n",
        "\n",
        "        # Save classification report\n",
        "        with open(os.path.join(test_results_dir, \"classification_report.txt\"), 'w') as f:\n",
        "            f.write(report)\n",
        "\n",
        "        # Save confusion matrix\n",
        "        cm = confusion_matrix(all_labels, all_preds)\n",
        "        cm_normalized = cm.astype('float') / cm.sum(axis=1)[:, np.newaxis]\n",
        "\n",
        "        plt.figure(figsize=(12, 10))\n",
        "        sns.heatmap(\n",
        "            cm_normalized,\n",
        "            annot=True,\n",
        "            fmt='.2f',\n",
        "            cmap='Blues',\n",
        "            xticklabels=self.class_names,\n",
        "            yticklabels=self.class_names\n",
        "        )\n",
        "        plt.xlabel(\"Predicted\")\n",
        "        plt.ylabel(\"True\")\n",
        "        plt.title(\"Test Set Confusion Matrix (Normalized)\")\n",
        "        plt.tight_layout()\n",
        "        plt.savefig(os.path.join(test_results_dir, \"confusion_matrix.png\"), dpi=150)\n",
        "        plt.close()\n",
        "\n",
        "        # Save predictions\n",
        "        results_df = pd.DataFrame({\n",
        "            'filename': all_filenames,\n",
        "            'true_label': [self.class_names[l] for l in all_labels],\n",
        "            'pred_label': [self.class_names[p] for p in all_preds],\n",
        "            'correct': [l == p for l, p in zip(all_labels, all_preds)]\n",
        "        })\n",
        "\n",
        "        # Add probabilities for each class\n",
        "        for i, class_name in enumerate(self.class_names):\n",
        "            results_df[f'prob_{class_name}'] = [probs[i] for probs in all_probs]\n",
        "\n",
        "        results_df.to_csv(os.path.join(test_results_dir, \"predictions.csv\"), index=False)\n",
        "\n",
        "        # Save metrics\n",
        "        metrics = {\n",
        "            'accuracy': float(accuracy),\n",
        "            'f1_weighted': float(f1_weighted),\n",
        "            'f1_macro': float(f1_macro),\n",
        "            'precision': float(precision),\n",
        "            'recall': float(recall)\n",
        "        }\n",
        "\n",
        "        with open(os.path.join(test_results_dir, \"metrics.json\"), 'w') as f:\n",
        "            json.dump(metrics, f, indent=2)\n",
        "\n",
        "        return metrics\n",
        "\n",
        "\n",
        "class EarlyStopping:\n",
        "    \"\"\"Early stopping to prevent overfitting\"\"\"\n",
        "    def __init__(self, patience=5, min_delta=0.001):\n",
        "        self.patience = patience\n",
        "        self.min_delta = min_delta\n",
        "        self.counter = 0\n",
        "        self.best_loss = None\n",
        "        self.early_stop = False\n",
        "\n",
        "    def __call__(self, val_loss):\n",
        "        if self.best_loss is None:\n",
        "            self.best_loss = val_loss\n",
        "        elif val_loss > self.best_loss - self.min_delta:\n",
        "            self.counter += 1\n",
        "            print(f\"EarlyStopping counter: {self.counter}/{self.patience}\")\n",
        "            if self.counter >= self.patience:\n",
        "                self.early_stop = True\n",
        "                return True\n",
        "        else:\n",
        "            self.best_loss = val_loss\n",
        "            self.counter = 0\n",
        "        return False\n",
        "\n",
        "\n",
        "class TeeFile:\n",
        "    \"\"\"File-like object that writes to multiple streams\"\"\"\n",
        "    def __init__(self, *file_objects_or_paths):\n",
        "        self.files = []\n",
        "        self.opened_files = []\n",
        "\n",
        "        for item in file_objects_or_paths:\n",
        "            if isinstance(item, str):\n",
        "                f = open(item, 'a', buffering=1)\n",
        "                self.files.append(f)\n",
        "                self.opened_files.append(f)\n",
        "            else:\n",
        "                self.files.append(item)\n",
        "\n",
        "    def write(self, data):\n",
        "        for f in self.files:\n",
        "            try:\n",
        "                f.write(data)\n",
        "                f.flush()\n",
        "            except Exception as e:\n",
        "                print(f\"Warning: Could not write to {f}: {e}\", file=sys.stderr)\n",
        "\n",
        "    def flush(self):\n",
        "        for f in self.files:\n",
        "            try:\n",
        "                f.flush()\n",
        "            except:\n",
        "                pass\n",
        "\n",
        "    def isatty(self):\n",
        "        return any(getattr(f, \"isatty\", lambda: False)() for f in self.files)\n",
        "\n",
        "    def close(self):\n",
        "        for f in self.opened_files:\n",
        "            try:\n",
        "                f.close()\n",
        "            except:\n",
        "                pass\n",
        "        self.opened_files.clear()\n",
        "\n",
        "    def __del__(self):\n",
        "        self.close()\n",
        "\n",
        "    def __enter__(self):\n",
        "        return self\n",
        "\n",
        "    def __exit__(self, exc_type, exc_val, exc_tb):\n",
        "        self.close()\n",
        "        return False\n",
        "\n",
        "\n",
        "# Example usage\n",
        "if __name__ == '__main__':\n",
        "    # Configuration\n",
        "    root = \"/content/drive/MyDrive/SPRSound/SPRSound-main\"\n",
        "\n",
        "    config = {\n",
        "        # Paths\n",
        "        \"csv_dir\": root,\n",
        "        \"logdir\": os.path.join(root, \"logs\"),\n",
        "        \"resume\": os.path.join(root, \"checkpoints\", \"best_model.pth\"),\n",
        "        \"dirsToMake\": [\n",
        "            os.path.join(root, \"checkpoints\"),\n",
        "            os.path.join(root, \"logs\"),\n",
        "            os.path.join(root, \"logs\", \"figures\")\n",
        "        ],\n",
        "\n",
        "        # Model\n",
        "        \"num_classes\": 2,  # normal, abnormal\n",
        "        \"dropout\": 0.4,\n",
        "        \"use_lora\": True,\n",
        "        \"lora_r\": 16,\n",
        "        \"lora_alpha\": 16,\n",
        "        \"lora_dropout\": 0.3,\n",
        "        \"lora_last_n_blocks\": 6,\n",
        "\n",
        "        # Training\n",
        "        \"lr\": 5e-5,\n",
        "        \"weight_decay\": 0.2,\n",
        "        \"warmup\": 10,\n",
        "        \"num_epochs\": 100,\n",
        "        \"batch_size\": 96,\n",
        "        \"accumulation\": 1,\n",
        "        \"use_amp\": False,\n",
        "        \"num_workers\": 2,\n",
        "\n",
        "        # Early stopping\n",
        "        \"early_stopping_patience\": 20,\n",
        "        \"early_stopping_min_delta\": 0.001,\n",
        "\n",
        "\n",
        "        # Device\n",
        "        \"device\": torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\"),\n",
        "    }\n",
        "\n",
        "    # Create trainer\n",
        "    trainer = RespiratoryTrainer(config)\n",
        "    if train_mode:\n",
        "      # Train\n",
        "      trainer.train()\n",
        "    elif test_mode:\n",
        "      # Test\n",
        "      trainer.test()"
      ]
    }
  ],
  "metadata": {
    "accelerator": "GPU",
    "colab": {
      "gpuType": "A100",
      "machine_shape": "hm",
      "provenance": []
    },
    "kernelspec": {
      "display_name": "Python 3",
      "name": "python3"
    },
    "language_info": {
      "name": "python"
    },
    "widgets": {
      "application/vnd.jupyter.widget-state+json": {
        "024be6229952428ab2864b3eb55dc117": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "05c3aa1ba9b84307bb8c6d4139fd4265": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "FloatProgressModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "FloatProgressModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "ProgressView",
            "bar_style": "success",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_066987f87c5b40758d7175504e83566d",
            "max": 392,
            "min": 0,
            "orientation": "horizontal",
            "style": "IPY_MODEL_a61d354d50a3444388629ce15de0d1c2",
            "value": 392
          }
        },
        "066987f87c5b40758d7175504e83566d": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "1370324eb86f47e785b4a1e04896e6b1": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "16ec7b6cf9884aa2a1a77f5dfcb65d7c": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "2cf91b6aad244705a9721b8704290d4b": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "2f2fa263a30e4ed1b80c06d41b13a29b": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "2fd3c35342ff4fd0b72fbed909bb6cda": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "3c95f65fafad4071ad9a16fdfd2ddab7": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "3e76226dc5f244d09c6ae03b074a505f": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_47ead54cc29e4bb79e520462e69116d3",
            "placeholder": "​",
            "style": "IPY_MODEL_2f2fa263a30e4ed1b80c06d41b13a29b",
            "value": "Loading weights: 100%"
          }
        },
        "47ead54cc29e4bb79e520462e69116d3": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "48a0e4b5fa85417a92f38b44b162849c": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "4cfb4d1f8ea54afa86ff3ce32a4889db": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "4d3b0629e80a4449870a784b5b62786b": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "817e5330a42748878c92829bbde7a9cd": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "ProgressStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "ProgressStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "bar_color": null,
            "description_width": ""
          }
        },
        "8a806bdafb6046b18ce57d80ad413040": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "8a9f0e5b71474967a27332869f7a1755": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "FloatProgressModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "FloatProgressModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "ProgressView",
            "bar_style": "success",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_16ec7b6cf9884aa2a1a77f5dfcb65d7c",
            "max": 533,
            "min": 0,
            "orientation": "horizontal",
            "style": "IPY_MODEL_817e5330a42748878c92829bbde7a9cd",
            "value": 533
          }
        },
        "8f6b4022643d4a2b85cf0ff7ca1d39ae": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "ProgressStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "ProgressStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "bar_color": null,
            "description_width": ""
          }
        },
        "a195f061dde54d0b84bf4bc7af03663f": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "a61d354d50a3444388629ce15de0d1c2": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "ProgressStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "ProgressStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "bar_color": null,
            "description_width": ""
          }
        },
        "a75cd80cecb54ec089a8de2fc59070a6": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HBoxModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HBoxModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HBoxView",
            "box_style": "",
            "children": [
              "IPY_MODEL_b9cd2cccec9140319ff16bdcc40a884b",
              "IPY_MODEL_aef1edfd1bf94319879409a909597dcd",
              "IPY_MODEL_bb31de74d6774fdb9bb15b24917e9b4d"
            ],
            "layout": "IPY_MODEL_e248e7c88b624c369ae18dee0e7d4c3d"
          }
        },
        "aef1edfd1bf94319879409a909597dcd": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "FloatProgressModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "FloatProgressModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "ProgressView",
            "bar_style": "success",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_4d3b0629e80a4449870a784b5b62786b",
            "max": 1212947234,
            "min": 0,
            "orientation": "horizontal",
            "style": "IPY_MODEL_8f6b4022643d4a2b85cf0ff7ca1d39ae",
            "value": 1212947234
          }
        },
        "b9cd2cccec9140319ff16bdcc40a884b": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_2cf91b6aad244705a9721b8704290d4b",
            "placeholder": "​",
            "style": "IPY_MODEL_e1dc8e90ba904e439af9eaa3f27aff8f",
            "value": "pytorch_model.bin: 100%"
          }
        },
        "b9f2f16c668b48efa2d019254d709dc3": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_2fd3c35342ff4fd0b72fbed909bb6cda",
            "placeholder": "​",
            "style": "IPY_MODEL_8a806bdafb6046b18ce57d80ad413040",
            "value": " 533/533 [00:00&lt;00:00, 65.4kB/s]"
          }
        },
        "bb31de74d6774fdb9bb15b24917e9b4d": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_a195f061dde54d0b84bf4bc7af03663f",
            "placeholder": "​",
            "style": "IPY_MODEL_3c95f65fafad4071ad9a16fdfd2ddab7",
            "value": " 1.21G/1.21G [00:03&lt;00:00, 709MB/s]"
          }
        },
        "c2fae8d5cbe54bbcbb93d5676f3b4db2": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_db97babd15c84f3f97822363e857de50",
            "placeholder": "​",
            "style": "IPY_MODEL_1370324eb86f47e785b4a1e04896e6b1",
            "value": "config.json: 100%"
          }
        },
        "c55f046386b7485188c5a23110e93630": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "d6b8c80f70e24e33b6c2104d82484004": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HBoxModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HBoxModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HBoxView",
            "box_style": "",
            "children": [
              "IPY_MODEL_c2fae8d5cbe54bbcbb93d5676f3b4db2",
              "IPY_MODEL_8a9f0e5b71474967a27332869f7a1755",
              "IPY_MODEL_b9f2f16c668b48efa2d019254d709dc3"
            ],
            "layout": "IPY_MODEL_4cfb4d1f8ea54afa86ff3ce32a4889db"
          }
        },
        "db97babd15c84f3f97822363e857de50": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "e1dc8e90ba904e439af9eaa3f27aff8f": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "e248e7c88b624c369ae18dee0e7d4c3d": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "e9895fad9318457a933fe6ce5e36cb5b": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_c55f046386b7485188c5a23110e93630",
            "placeholder": "​",
            "style": "IPY_MODEL_48a0e4b5fa85417a92f38b44b162849c",
            "value": " 392/392 [00:00&lt;00:00, 1510.87it/s, Materializing param=pooler.dense.weight]"
          }
        },
        "e9a5eaf20a8a49e495e90fad044b26fb": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HBoxModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HBoxModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HBoxView",
            "box_style": "",
            "children": [
              "IPY_MODEL_3e76226dc5f244d09c6ae03b074a505f",
              "IPY_MODEL_05c3aa1ba9b84307bb8c6d4139fd4265",
              "IPY_MODEL_e9895fad9318457a933fe6ce5e36cb5b"
            ],
            "layout": "IPY_MODEL_024be6229952428ab2864b3eb55dc117"
          }
        }
      }
    }
  },
  "nbformat": 4,
  "nbformat_minor": 0
}