{
  "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
  "test_episodes": [
    4,
    5,
    14,
    19
  ],
  "require_next_class": true,
  "thresholds": [
    0.2,
    0.25,
    0.3,
    0.35,
    0.4,
    0.45,
    0.5,
    0.55,
    0.6,
    0.65,
    0.7
  ],
  "summaries": [
    {
      "early_switch_count": 0,
      "sequence_completion_rate": 0.75,
      "chunk_language_accuracy": 0.76171875,
      "frame_language_accuracy": 0.7460285614616118,
      "threshold": 0.2,
      "class_accuracy": 0.9955503512880562,
      "switch_macro_f1": 0.8983067854007274,
      "per_switch_f1": [
        0.8403361344537814,
        0.9142857142857143,
        0.9402985074626866
      ],
      "per_switch_recall": [
        0.78125,
        1.0,
        0.984375
      ],
      "episode_switch_delays": {
        "4": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 10
        },
        "5": {
          "0->1": 5,
          "1->2": 1,
          "2->3": 1
        },
        "14": {
          "0->1": null,
          "1->2": null,
          "2->3": null
        },
        "19": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 5
        }
      }
    },
    {
      "early_switch_count": 0,
      "sequence_completion_rate": 0.75,
      "chunk_language_accuracy": 0.76171875,
      "frame_language_accuracy": 0.7460285614616118,
      "threshold": 0.25,
      "class_accuracy": 0.9955503512880562,
      "switch_macro_f1": 0.8983067854007274,
      "per_switch_f1": [
        0.8403361344537814,
        0.9142857142857143,
        0.9402985074626866
      ],
      "per_switch_recall": [
        0.78125,
        1.0,
        0.984375
      ],
      "episode_switch_delays": {
        "4": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 10
        },
        "5": {
          "0->1": 5,
          "1->2": 1,
          "2->3": 1
        },
        "14": {
          "0->1": null,
          "1->2": null,
          "2->3": null
        },
        "19": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 5
        }
      }
    },
    {
      "early_switch_count": 0,
      "sequence_completion_rate": 0.75,
      "chunk_language_accuracy": 0.76171875,
      "frame_language_accuracy": 0.7460285614616118,
      "threshold": 0.3,
      "class_accuracy": 0.9955503512880562,
      "switch_macro_f1": 0.9006806162890149,
      "per_switch_f1": [
        0.847457627118644,
        0.9142857142857143,
        0.9402985074626866
      ],
      "per_switch_recall": [
        0.78125,
        1.0,
        0.984375
      ],
      "episode_switch_delays": {
        "4": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 10
        },
        "5": {
          "0->1": 5,
          "1->2": 1,
          "2->3": 1
        },
        "14": {
          "0->1": null,
          "1->2": null,
          "2->3": null
        },
        "19": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 5
        }
      }
    },
    {
      "early_switch_count": 0,
      "sequence_completion_rate": 0.75,
      "chunk_language_accuracy": 0.76171875,
      "frame_language_accuracy": 0.7460285614616118,
      "threshold": 0.35,
      "class_accuracy": 0.9955503512880562,
      "switch_macro_f1": 0.8973970197850795,
      "per_switch_f1": [
        0.8376068376068376,
        0.9142857142857143,
        0.9402985074626866
      ],
      "per_switch_recall": [
        0.765625,
        1.0,
        0.984375
      ],
      "episode_switch_delays": {
        "4": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 10
        },
        "5": {
          "0->1": 5,
          "1->2": 1,
          "2->3": 1
        },
        "14": {
          "0->1": null,
          "1->2": null,
          "2->3": null
        },
        "19": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 5
        }
      }
    },
    {
      "early_switch_count": 0,
      "sequence_completion_rate": 0.75,
      "chunk_language_accuracy": 0.76171875,
      "frame_language_accuracy": 0.7460285614616118,
      "threshold": 0.4,
      "class_accuracy": 0.9955503512880562,
      "switch_macro_f1": 0.8940568095483176,
      "per_switch_f1": [
        0.8275862068965517,
        0.9142857142857143,
        0.9402985074626866
      ],
      "per_switch_recall": [
        0.75,
        1.0,
        0.984375
      ],
      "episode_switch_delays": {
        "4": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 10
        },
        "5": {
          "0->1": 5,
          "1->2": 1,
          "2->3": 1
        },
        "14": {
          "0->1": null,
          "1->2": null,
          "2->3": null
        },
        "19": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 5
        }
      }
    },
    {
      "early_switch_count": 0,
      "sequence_completion_rate": 0.75,
      "chunk_language_accuracy": 0.76171875,
      "frame_language_accuracy": 0.7460285614616118,
      "threshold": 0.45,
      "class_accuracy": 0.9955503512880562,
      "switch_macro_f1": 0.8940568095483176,
      "per_switch_f1": [
        0.8275862068965517,
        0.9142857142857143,
        0.9402985074626866
      ],
      "per_switch_recall": [
        0.75,
        1.0,
        0.984375
      ],
      "episode_switch_delays": {
        "4": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 10
        },
        "5": {
          "0->1": 5,
          "1->2": 1,
          "2->3": 1
        },
        "14": {
          "0->1": null,
          "1->2": null,
          "2->3": null
        },
        "19": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 5
        }
      }
    },
    {
      "early_switch_count": 0,
      "sequence_completion_rate": 0.75,
      "chunk_language_accuracy": 0.76171875,
      "frame_language_accuracy": 0.7460285614616118,
      "threshold": 0.5,
      "class_accuracy": 0.9955503512880562,
      "switch_macro_f1": 0.9010890266576999,
      "per_switch_f1": [
        0.8421052631578947,
        0.9208633093525179,
        0.9402985074626866
      ],
      "per_switch_recall": [
        0.75,
        1.0,
        0.984375
      ],
      "episode_switch_delays": {
        "4": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 10
        },
        "5": {
          "0->1": 5,
          "1->2": 1,
          "2->3": 1
        },
        "14": {
          "0->1": null,
          "1->2": null,
          "2->3": null
        },
        "19": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 5
        }
      }
    },
    {
      "early_switch_count": 0,
      "sequence_completion_rate": 0.75,
      "chunk_language_accuracy": 0.76171875,
      "frame_language_accuracy": 0.7460285614616118,
      "threshold": 0.55,
      "class_accuracy": 0.9955503512880562,
      "switch_macro_f1": 0.8941967960812587,
      "per_switch_f1": [
        0.8214285714285714,
        0.9208633093525179,
        0.9402985074626866
      ],
      "per_switch_recall": [
        0.71875,
        1.0,
        0.984375
      ],
      "episode_switch_delays": {
        "4": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 10
        },
        "5": {
          "0->1": 5,
          "1->2": 1,
          "2->3": 1
        },
        "14": {
          "0->1": null,
          "1->2": null,
          "2->3": null
        },
        "19": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 5
        }
      }
    },
    {
      "early_switch_count": 0,
      "sequence_completion_rate": 0.75,
      "chunk_language_accuracy": 0.76171875,
      "frame_language_accuracy": 0.7460285614616118,
      "threshold": 0.6,
      "class_accuracy": 0.9955503512880562,
      "switch_macro_f1": 0.8990201864113261,
      "per_switch_f1": [
        0.8288288288288289,
        0.9208633093525179,
        0.9473684210526315
      ],
      "per_switch_recall": [
        0.71875,
        1.0,
        0.984375
      ],
      "episode_switch_delays": {
        "4": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 10
        },
        "5": {
          "0->1": 5,
          "1->2": 1,
          "2->3": 1
        },
        "14": {
          "0->1": null,
          "1->2": null,
          "2->3": null
        },
        "19": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 5
        }
      }
    },
    {
      "early_switch_count": 0,
      "sequence_completion_rate": 0.75,
      "chunk_language_accuracy": 0.76171875,
      "frame_language_accuracy": 0.7460285614616118,
      "threshold": 0.65,
      "class_accuracy": 0.9955503512880562,
      "switch_macro_f1": 0.9014125309089338,
      "per_switch_f1": [
        0.8288288288288289,
        0.9208633093525179,
        0.9545454545454545
      ],
      "per_switch_recall": [
        0.71875,
        1.0,
        0.984375
      ],
      "episode_switch_delays": {
        "4": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 10
        },
        "5": {
          "0->1": 5,
          "1->2": 1,
          "2->3": 1
        },
        "14": {
          "0->1": null,
          "1->2": null,
          "2->3": null
        },
        "19": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 5
        }
      }
    },
    {
      "early_switch_count": 0,
      "sequence_completion_rate": 0.75,
      "chunk_language_accuracy": 0.76171875,
      "frame_language_accuracy": 0.7460285614616118,
      "threshold": 0.7,
      "class_accuracy": 0.9955503512880562,
      "switch_macro_f1": 0.8987523412258435,
      "per_switch_f1": [
        0.8288288288288289,
        0.9208633093525179,
        0.9465648854961832
      ],
      "per_switch_recall": [
        0.71875,
        1.0,
        0.96875
      ],
      "episode_switch_delays": {
        "4": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 10
        },
        "5": {
          "0->1": 5,
          "1->2": 1,
          "2->3": 1
        },
        "14": {
          "0->1": null,
          "1->2": null,
          "2->3": null
        },
        "19": {
          "0->1": 8,
          "1->2": 10,
          "2->3": 5
        }
      }
    }
  ],
  "reports": [
    {
      "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
      "test_episodes": [
        4,
        5,
        14,
        19
      ],
      "threshold": 0.2,
      "require_next_class": true,
      "frame_metrics": {
        "class_accuracy": 0.9955503512880562,
        "switch_macro_f1": 0.8983067854007274,
        "per_switch": [
          {
            "transition": "0->1",
            "tp": 50,
            "fp": 5,
            "fn": 14,
            "tn": 4201,
            "precision": 0.9090909090909091,
            "recall": 0.78125,
            "f1": 0.8403361344537814
          },
          {
            "transition": "1->2",
            "tp": 64,
            "fp": 12,
            "fn": 0,
            "tn": 4194,
            "precision": 0.8421052631578947,
            "recall": 1.0,
            "f1": 0.9142857142857143
          },
          {
            "transition": "2->3",
            "tp": 63,
            "fp": 7,
            "fn": 1,
            "tn": 4199,
            "precision": 0.9,
            "recall": 0.984375,
            "f1": 0.9402985074626866
          }
        ]
      },
      "episode_metrics": [
        {
          "episode_index": 4,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9742647058823529,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 10
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 512,
            "2->3": 688
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 502,
              "from": 1,
              "to": 2
            },
            {
              "frame": 678,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 5,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9937722419928826,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 5,
            "1->2": 1,
            "2->3": 1
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 544,
            "2->3": 720
          },
          "boundaries": [
            {
              "frame": 43,
              "from": 0,
              "to": 1
            },
            {
              "frame": 543,
              "from": 1,
              "to": 2
            },
            {
              "frame": 719,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 14,
          "chunk_language_accuracy": 0.046875,
          "frame_language_accuracy": 0.03823529411764706,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": null,
            "1->2": null,
            "2->3": null
          },
          "sequence_completed": false,
          "switch_frames": {},
          "boundaries": [
            {
              "frame": 39,
              "from": 0,
              "to": 1
            },
            {
              "frame": 484,
              "from": 1,
              "to": 2
            },
            {
              "frame": 663,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 19,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9778420038535646,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 5
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 496,
            "2->3": 672
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 486,
              "from": 1,
              "to": 2
            },
            {
              "frame": 667,
              "from": 2,
              "to": 3
            }
          ]
        }
      ],
      "summary": {
        "early_switch_count": 0,
        "sequence_completion_rate": 0.75,
        "chunk_language_accuracy": 0.76171875,
        "frame_language_accuracy": 0.7460285614616118
      }
    },
    {
      "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
      "test_episodes": [
        4,
        5,
        14,
        19
      ],
      "threshold": 0.25,
      "require_next_class": true,
      "frame_metrics": {
        "class_accuracy": 0.9955503512880562,
        "switch_macro_f1": 0.8983067854007274,
        "per_switch": [
          {
            "transition": "0->1",
            "tp": 50,
            "fp": 5,
            "fn": 14,
            "tn": 4201,
            "precision": 0.9090909090909091,
            "recall": 0.78125,
            "f1": 0.8403361344537814
          },
          {
            "transition": "1->2",
            "tp": 64,
            "fp": 12,
            "fn": 0,
            "tn": 4194,
            "precision": 0.8421052631578947,
            "recall": 1.0,
            "f1": 0.9142857142857143
          },
          {
            "transition": "2->3",
            "tp": 63,
            "fp": 7,
            "fn": 1,
            "tn": 4199,
            "precision": 0.9,
            "recall": 0.984375,
            "f1": 0.9402985074626866
          }
        ]
      },
      "episode_metrics": [
        {
          "episode_index": 4,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9742647058823529,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 10
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 512,
            "2->3": 688
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 502,
              "from": 1,
              "to": 2
            },
            {
              "frame": 678,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 5,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9937722419928826,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 5,
            "1->2": 1,
            "2->3": 1
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 544,
            "2->3": 720
          },
          "boundaries": [
            {
              "frame": 43,
              "from": 0,
              "to": 1
            },
            {
              "frame": 543,
              "from": 1,
              "to": 2
            },
            {
              "frame": 719,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 14,
          "chunk_language_accuracy": 0.046875,
          "frame_language_accuracy": 0.03823529411764706,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": null,
            "1->2": null,
            "2->3": null
          },
          "sequence_completed": false,
          "switch_frames": {},
          "boundaries": [
            {
              "frame": 39,
              "from": 0,
              "to": 1
            },
            {
              "frame": 484,
              "from": 1,
              "to": 2
            },
            {
              "frame": 663,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 19,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9778420038535646,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 5
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 496,
            "2->3": 672
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 486,
              "from": 1,
              "to": 2
            },
            {
              "frame": 667,
              "from": 2,
              "to": 3
            }
          ]
        }
      ],
      "summary": {
        "early_switch_count": 0,
        "sequence_completion_rate": 0.75,
        "chunk_language_accuracy": 0.76171875,
        "frame_language_accuracy": 0.7460285614616118
      }
    },
    {
      "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
      "test_episodes": [
        4,
        5,
        14,
        19
      ],
      "threshold": 0.3,
      "require_next_class": true,
      "frame_metrics": {
        "class_accuracy": 0.9955503512880562,
        "switch_macro_f1": 0.9006806162890149,
        "per_switch": [
          {
            "transition": "0->1",
            "tp": 50,
            "fp": 4,
            "fn": 14,
            "tn": 4202,
            "precision": 0.9259259259259259,
            "recall": 0.78125,
            "f1": 0.847457627118644
          },
          {
            "transition": "1->2",
            "tp": 64,
            "fp": 12,
            "fn": 0,
            "tn": 4194,
            "precision": 0.8421052631578947,
            "recall": 1.0,
            "f1": 0.9142857142857143
          },
          {
            "transition": "2->3",
            "tp": 63,
            "fp": 7,
            "fn": 1,
            "tn": 4199,
            "precision": 0.9,
            "recall": 0.984375,
            "f1": 0.9402985074626866
          }
        ]
      },
      "episode_metrics": [
        {
          "episode_index": 4,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9742647058823529,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 10
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 512,
            "2->3": 688
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 502,
              "from": 1,
              "to": 2
            },
            {
              "frame": 678,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 5,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9937722419928826,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 5,
            "1->2": 1,
            "2->3": 1
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 544,
            "2->3": 720
          },
          "boundaries": [
            {
              "frame": 43,
              "from": 0,
              "to": 1
            },
            {
              "frame": 543,
              "from": 1,
              "to": 2
            },
            {
              "frame": 719,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 14,
          "chunk_language_accuracy": 0.046875,
          "frame_language_accuracy": 0.03823529411764706,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": null,
            "1->2": null,
            "2->3": null
          },
          "sequence_completed": false,
          "switch_frames": {},
          "boundaries": [
            {
              "frame": 39,
              "from": 0,
              "to": 1
            },
            {
              "frame": 484,
              "from": 1,
              "to": 2
            },
            {
              "frame": 663,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 19,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9778420038535646,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 5
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 496,
            "2->3": 672
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 486,
              "from": 1,
              "to": 2
            },
            {
              "frame": 667,
              "from": 2,
              "to": 3
            }
          ]
        }
      ],
      "summary": {
        "early_switch_count": 0,
        "sequence_completion_rate": 0.75,
        "chunk_language_accuracy": 0.76171875,
        "frame_language_accuracy": 0.7460285614616118
      }
    },
    {
      "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
      "test_episodes": [
        4,
        5,
        14,
        19
      ],
      "threshold": 0.35,
      "require_next_class": true,
      "frame_metrics": {
        "class_accuracy": 0.9955503512880562,
        "switch_macro_f1": 0.8973970197850795,
        "per_switch": [
          {
            "transition": "0->1",
            "tp": 49,
            "fp": 4,
            "fn": 15,
            "tn": 4202,
            "precision": 0.9245283018867925,
            "recall": 0.765625,
            "f1": 0.8376068376068376
          },
          {
            "transition": "1->2",
            "tp": 64,
            "fp": 12,
            "fn": 0,
            "tn": 4194,
            "precision": 0.8421052631578947,
            "recall": 1.0,
            "f1": 0.9142857142857143
          },
          {
            "transition": "2->3",
            "tp": 63,
            "fp": 7,
            "fn": 1,
            "tn": 4199,
            "precision": 0.9,
            "recall": 0.984375,
            "f1": 0.9402985074626866
          }
        ]
      },
      "episode_metrics": [
        {
          "episode_index": 4,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9742647058823529,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 10
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 512,
            "2->3": 688
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 502,
              "from": 1,
              "to": 2
            },
            {
              "frame": 678,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 5,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9937722419928826,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 5,
            "1->2": 1,
            "2->3": 1
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 544,
            "2->3": 720
          },
          "boundaries": [
            {
              "frame": 43,
              "from": 0,
              "to": 1
            },
            {
              "frame": 543,
              "from": 1,
              "to": 2
            },
            {
              "frame": 719,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 14,
          "chunk_language_accuracy": 0.046875,
          "frame_language_accuracy": 0.03823529411764706,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": null,
            "1->2": null,
            "2->3": null
          },
          "sequence_completed": false,
          "switch_frames": {},
          "boundaries": [
            {
              "frame": 39,
              "from": 0,
              "to": 1
            },
            {
              "frame": 484,
              "from": 1,
              "to": 2
            },
            {
              "frame": 663,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 19,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9778420038535646,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 5
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 496,
            "2->3": 672
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 486,
              "from": 1,
              "to": 2
            },
            {
              "frame": 667,
              "from": 2,
              "to": 3
            }
          ]
        }
      ],
      "summary": {
        "early_switch_count": 0,
        "sequence_completion_rate": 0.75,
        "chunk_language_accuracy": 0.76171875,
        "frame_language_accuracy": 0.7460285614616118
      }
    },
    {
      "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
      "test_episodes": [
        4,
        5,
        14,
        19
      ],
      "threshold": 0.4,
      "require_next_class": true,
      "frame_metrics": {
        "class_accuracy": 0.9955503512880562,
        "switch_macro_f1": 0.8940568095483176,
        "per_switch": [
          {
            "transition": "0->1",
            "tp": 48,
            "fp": 4,
            "fn": 16,
            "tn": 4202,
            "precision": 0.9230769230769231,
            "recall": 0.75,
            "f1": 0.8275862068965517
          },
          {
            "transition": "1->2",
            "tp": 64,
            "fp": 12,
            "fn": 0,
            "tn": 4194,
            "precision": 0.8421052631578947,
            "recall": 1.0,
            "f1": 0.9142857142857143
          },
          {
            "transition": "2->3",
            "tp": 63,
            "fp": 7,
            "fn": 1,
            "tn": 4199,
            "precision": 0.9,
            "recall": 0.984375,
            "f1": 0.9402985074626866
          }
        ]
      },
      "episode_metrics": [
        {
          "episode_index": 4,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9742647058823529,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 10
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 512,
            "2->3": 688
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 502,
              "from": 1,
              "to": 2
            },
            {
              "frame": 678,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 5,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9937722419928826,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 5,
            "1->2": 1,
            "2->3": 1
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 544,
            "2->3": 720
          },
          "boundaries": [
            {
              "frame": 43,
              "from": 0,
              "to": 1
            },
            {
              "frame": 543,
              "from": 1,
              "to": 2
            },
            {
              "frame": 719,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 14,
          "chunk_language_accuracy": 0.046875,
          "frame_language_accuracy": 0.03823529411764706,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": null,
            "1->2": null,
            "2->3": null
          },
          "sequence_completed": false,
          "switch_frames": {},
          "boundaries": [
            {
              "frame": 39,
              "from": 0,
              "to": 1
            },
            {
              "frame": 484,
              "from": 1,
              "to": 2
            },
            {
              "frame": 663,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 19,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9778420038535646,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 5
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 496,
            "2->3": 672
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 486,
              "from": 1,
              "to": 2
            },
            {
              "frame": 667,
              "from": 2,
              "to": 3
            }
          ]
        }
      ],
      "summary": {
        "early_switch_count": 0,
        "sequence_completion_rate": 0.75,
        "chunk_language_accuracy": 0.76171875,
        "frame_language_accuracy": 0.7460285614616118
      }
    },
    {
      "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
      "test_episodes": [
        4,
        5,
        14,
        19
      ],
      "threshold": 0.45,
      "require_next_class": true,
      "frame_metrics": {
        "class_accuracy": 0.9955503512880562,
        "switch_macro_f1": 0.8940568095483176,
        "per_switch": [
          {
            "transition": "0->1",
            "tp": 48,
            "fp": 4,
            "fn": 16,
            "tn": 4202,
            "precision": 0.9230769230769231,
            "recall": 0.75,
            "f1": 0.8275862068965517
          },
          {
            "transition": "1->2",
            "tp": 64,
            "fp": 12,
            "fn": 0,
            "tn": 4194,
            "precision": 0.8421052631578947,
            "recall": 1.0,
            "f1": 0.9142857142857143
          },
          {
            "transition": "2->3",
            "tp": 63,
            "fp": 7,
            "fn": 1,
            "tn": 4199,
            "precision": 0.9,
            "recall": 0.984375,
            "f1": 0.9402985074626866
          }
        ]
      },
      "episode_metrics": [
        {
          "episode_index": 4,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9742647058823529,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 10
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 512,
            "2->3": 688
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 502,
              "from": 1,
              "to": 2
            },
            {
              "frame": 678,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 5,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9937722419928826,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 5,
            "1->2": 1,
            "2->3": 1
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 544,
            "2->3": 720
          },
          "boundaries": [
            {
              "frame": 43,
              "from": 0,
              "to": 1
            },
            {
              "frame": 543,
              "from": 1,
              "to": 2
            },
            {
              "frame": 719,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 14,
          "chunk_language_accuracy": 0.046875,
          "frame_language_accuracy": 0.03823529411764706,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": null,
            "1->2": null,
            "2->3": null
          },
          "sequence_completed": false,
          "switch_frames": {},
          "boundaries": [
            {
              "frame": 39,
              "from": 0,
              "to": 1
            },
            {
              "frame": 484,
              "from": 1,
              "to": 2
            },
            {
              "frame": 663,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 19,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9778420038535646,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 5
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 496,
            "2->3": 672
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 486,
              "from": 1,
              "to": 2
            },
            {
              "frame": 667,
              "from": 2,
              "to": 3
            }
          ]
        }
      ],
      "summary": {
        "early_switch_count": 0,
        "sequence_completion_rate": 0.75,
        "chunk_language_accuracy": 0.76171875,
        "frame_language_accuracy": 0.7460285614616118
      }
    },
    {
      "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
      "test_episodes": [
        4,
        5,
        14,
        19
      ],
      "threshold": 0.5,
      "require_next_class": true,
      "frame_metrics": {
        "class_accuracy": 0.9955503512880562,
        "switch_macro_f1": 0.9010890266576999,
        "per_switch": [
          {
            "transition": "0->1",
            "tp": 48,
            "fp": 2,
            "fn": 16,
            "tn": 4204,
            "precision": 0.96,
            "recall": 0.75,
            "f1": 0.8421052631578947
          },
          {
            "transition": "1->2",
            "tp": 64,
            "fp": 11,
            "fn": 0,
            "tn": 4195,
            "precision": 0.8533333333333334,
            "recall": 1.0,
            "f1": 0.9208633093525179
          },
          {
            "transition": "2->3",
            "tp": 63,
            "fp": 7,
            "fn": 1,
            "tn": 4199,
            "precision": 0.9,
            "recall": 0.984375,
            "f1": 0.9402985074626866
          }
        ]
      },
      "episode_metrics": [
        {
          "episode_index": 4,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9742647058823529,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 10
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 512,
            "2->3": 688
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 502,
              "from": 1,
              "to": 2
            },
            {
              "frame": 678,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 5,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9937722419928826,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 5,
            "1->2": 1,
            "2->3": 1
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 544,
            "2->3": 720
          },
          "boundaries": [
            {
              "frame": 43,
              "from": 0,
              "to": 1
            },
            {
              "frame": 543,
              "from": 1,
              "to": 2
            },
            {
              "frame": 719,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 14,
          "chunk_language_accuracy": 0.046875,
          "frame_language_accuracy": 0.03823529411764706,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": null,
            "1->2": null,
            "2->3": null
          },
          "sequence_completed": false,
          "switch_frames": {},
          "boundaries": [
            {
              "frame": 39,
              "from": 0,
              "to": 1
            },
            {
              "frame": 484,
              "from": 1,
              "to": 2
            },
            {
              "frame": 663,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 19,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9778420038535646,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 5
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 496,
            "2->3": 672
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 486,
              "from": 1,
              "to": 2
            },
            {
              "frame": 667,
              "from": 2,
              "to": 3
            }
          ]
        }
      ],
      "summary": {
        "early_switch_count": 0,
        "sequence_completion_rate": 0.75,
        "chunk_language_accuracy": 0.76171875,
        "frame_language_accuracy": 0.7460285614616118
      }
    },
    {
      "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
      "test_episodes": [
        4,
        5,
        14,
        19
      ],
      "threshold": 0.55,
      "require_next_class": true,
      "frame_metrics": {
        "class_accuracy": 0.9955503512880562,
        "switch_macro_f1": 0.8941967960812587,
        "per_switch": [
          {
            "transition": "0->1",
            "tp": 46,
            "fp": 2,
            "fn": 18,
            "tn": 4204,
            "precision": 0.9583333333333334,
            "recall": 0.71875,
            "f1": 0.8214285714285714
          },
          {
            "transition": "1->2",
            "tp": 64,
            "fp": 11,
            "fn": 0,
            "tn": 4195,
            "precision": 0.8533333333333334,
            "recall": 1.0,
            "f1": 0.9208633093525179
          },
          {
            "transition": "2->3",
            "tp": 63,
            "fp": 7,
            "fn": 1,
            "tn": 4199,
            "precision": 0.9,
            "recall": 0.984375,
            "f1": 0.9402985074626866
          }
        ]
      },
      "episode_metrics": [
        {
          "episode_index": 4,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9742647058823529,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 10
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 512,
            "2->3": 688
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 502,
              "from": 1,
              "to": 2
            },
            {
              "frame": 678,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 5,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9937722419928826,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 5,
            "1->2": 1,
            "2->3": 1
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 544,
            "2->3": 720
          },
          "boundaries": [
            {
              "frame": 43,
              "from": 0,
              "to": 1
            },
            {
              "frame": 543,
              "from": 1,
              "to": 2
            },
            {
              "frame": 719,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 14,
          "chunk_language_accuracy": 0.046875,
          "frame_language_accuracy": 0.03823529411764706,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": null,
            "1->2": null,
            "2->3": null
          },
          "sequence_completed": false,
          "switch_frames": {},
          "boundaries": [
            {
              "frame": 39,
              "from": 0,
              "to": 1
            },
            {
              "frame": 484,
              "from": 1,
              "to": 2
            },
            {
              "frame": 663,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 19,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9778420038535646,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 5
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 496,
            "2->3": 672
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 486,
              "from": 1,
              "to": 2
            },
            {
              "frame": 667,
              "from": 2,
              "to": 3
            }
          ]
        }
      ],
      "summary": {
        "early_switch_count": 0,
        "sequence_completion_rate": 0.75,
        "chunk_language_accuracy": 0.76171875,
        "frame_language_accuracy": 0.7460285614616118
      }
    },
    {
      "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
      "test_episodes": [
        4,
        5,
        14,
        19
      ],
      "threshold": 0.6,
      "require_next_class": true,
      "frame_metrics": {
        "class_accuracy": 0.9955503512880562,
        "switch_macro_f1": 0.8990201864113261,
        "per_switch": [
          {
            "transition": "0->1",
            "tp": 46,
            "fp": 1,
            "fn": 18,
            "tn": 4205,
            "precision": 0.9787234042553191,
            "recall": 0.71875,
            "f1": 0.8288288288288289
          },
          {
            "transition": "1->2",
            "tp": 64,
            "fp": 11,
            "fn": 0,
            "tn": 4195,
            "precision": 0.8533333333333334,
            "recall": 1.0,
            "f1": 0.9208633093525179
          },
          {
            "transition": "2->3",
            "tp": 63,
            "fp": 6,
            "fn": 1,
            "tn": 4200,
            "precision": 0.9130434782608695,
            "recall": 0.984375,
            "f1": 0.9473684210526315
          }
        ]
      },
      "episode_metrics": [
        {
          "episode_index": 4,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9742647058823529,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 10
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 512,
            "2->3": 688
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 502,
              "from": 1,
              "to": 2
            },
            {
              "frame": 678,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 5,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9937722419928826,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 5,
            "1->2": 1,
            "2->3": 1
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 544,
            "2->3": 720
          },
          "boundaries": [
            {
              "frame": 43,
              "from": 0,
              "to": 1
            },
            {
              "frame": 543,
              "from": 1,
              "to": 2
            },
            {
              "frame": 719,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 14,
          "chunk_language_accuracy": 0.046875,
          "frame_language_accuracy": 0.03823529411764706,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": null,
            "1->2": null,
            "2->3": null
          },
          "sequence_completed": false,
          "switch_frames": {},
          "boundaries": [
            {
              "frame": 39,
              "from": 0,
              "to": 1
            },
            {
              "frame": 484,
              "from": 1,
              "to": 2
            },
            {
              "frame": 663,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 19,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9778420038535646,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 5
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 496,
            "2->3": 672
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 486,
              "from": 1,
              "to": 2
            },
            {
              "frame": 667,
              "from": 2,
              "to": 3
            }
          ]
        }
      ],
      "summary": {
        "early_switch_count": 0,
        "sequence_completion_rate": 0.75,
        "chunk_language_accuracy": 0.76171875,
        "frame_language_accuracy": 0.7460285614616118
      }
    },
    {
      "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
      "test_episodes": [
        4,
        5,
        14,
        19
      ],
      "threshold": 0.65,
      "require_next_class": true,
      "frame_metrics": {
        "class_accuracy": 0.9955503512880562,
        "switch_macro_f1": 0.9014125309089338,
        "per_switch": [
          {
            "transition": "0->1",
            "tp": 46,
            "fp": 1,
            "fn": 18,
            "tn": 4205,
            "precision": 0.9787234042553191,
            "recall": 0.71875,
            "f1": 0.8288288288288289
          },
          {
            "transition": "1->2",
            "tp": 64,
            "fp": 11,
            "fn": 0,
            "tn": 4195,
            "precision": 0.8533333333333334,
            "recall": 1.0,
            "f1": 0.9208633093525179
          },
          {
            "transition": "2->3",
            "tp": 63,
            "fp": 5,
            "fn": 1,
            "tn": 4201,
            "precision": 0.9264705882352942,
            "recall": 0.984375,
            "f1": 0.9545454545454545
          }
        ]
      },
      "episode_metrics": [
        {
          "episode_index": 4,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9742647058823529,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 10
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 512,
            "2->3": 688
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 502,
              "from": 1,
              "to": 2
            },
            {
              "frame": 678,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 5,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9937722419928826,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 5,
            "1->2": 1,
            "2->3": 1
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 544,
            "2->3": 720
          },
          "boundaries": [
            {
              "frame": 43,
              "from": 0,
              "to": 1
            },
            {
              "frame": 543,
              "from": 1,
              "to": 2
            },
            {
              "frame": 719,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 14,
          "chunk_language_accuracy": 0.046875,
          "frame_language_accuracy": 0.03823529411764706,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": null,
            "1->2": null,
            "2->3": null
          },
          "sequence_completed": false,
          "switch_frames": {},
          "boundaries": [
            {
              "frame": 39,
              "from": 0,
              "to": 1
            },
            {
              "frame": 484,
              "from": 1,
              "to": 2
            },
            {
              "frame": 663,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 19,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9778420038535646,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 5
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 496,
            "2->3": 672
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 486,
              "from": 1,
              "to": 2
            },
            {
              "frame": 667,
              "from": 2,
              "to": 3
            }
          ]
        }
      ],
      "summary": {
        "early_switch_count": 0,
        "sequence_completion_rate": 0.75,
        "chunk_language_accuracy": 0.76171875,
        "frame_language_accuracy": 0.7460285614616118
      }
    },
    {
      "model_path": "/home/ubuntu/groot_workspace/checkpoints/siglip2_decision_4class_state22_woidle_post1chunk/best_model.pt",
      "test_episodes": [
        4,
        5,
        14,
        19
      ],
      "threshold": 0.7,
      "require_next_class": true,
      "frame_metrics": {
        "class_accuracy": 0.9955503512880562,
        "switch_macro_f1": 0.8987523412258435,
        "per_switch": [
          {
            "transition": "0->1",
            "tp": 46,
            "fp": 1,
            "fn": 18,
            "tn": 4205,
            "precision": 0.9787234042553191,
            "recall": 0.71875,
            "f1": 0.8288288288288289
          },
          {
            "transition": "1->2",
            "tp": 64,
            "fp": 11,
            "fn": 0,
            "tn": 4195,
            "precision": 0.8533333333333334,
            "recall": 1.0,
            "f1": 0.9208633093525179
          },
          {
            "transition": "2->3",
            "tp": 62,
            "fp": 5,
            "fn": 2,
            "tn": 4201,
            "precision": 0.9253731343283582,
            "recall": 0.96875,
            "f1": 0.9465648854961832
          }
        ]
      },
      "episode_metrics": [
        {
          "episode_index": 4,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9742647058823529,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 10
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 512,
            "2->3": 688
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 502,
              "from": 1,
              "to": 2
            },
            {
              "frame": 678,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 5,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9937722419928826,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 5,
            "1->2": 1,
            "2->3": 1
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 544,
            "2->3": 720
          },
          "boundaries": [
            {
              "frame": 43,
              "from": 0,
              "to": 1
            },
            {
              "frame": 543,
              "from": 1,
              "to": 2
            },
            {
              "frame": 719,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 14,
          "chunk_language_accuracy": 0.046875,
          "frame_language_accuracy": 0.03823529411764706,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": null,
            "1->2": null,
            "2->3": null
          },
          "sequence_completed": false,
          "switch_frames": {},
          "boundaries": [
            {
              "frame": 39,
              "from": 0,
              "to": 1
            },
            {
              "frame": 484,
              "from": 1,
              "to": 2
            },
            {
              "frame": 663,
              "from": 2,
              "to": 3
            }
          ]
        },
        {
          "episode_index": 19,
          "chunk_language_accuracy": 1.0,
          "frame_language_accuracy": 0.9778420038535646,
          "early_switch_count": 0,
          "switch_delays": {
            "0->1": 8,
            "1->2": 10,
            "2->3": 5
          },
          "sequence_completed": true,
          "switch_frames": {
            "0->1": 48,
            "1->2": 496,
            "2->3": 672
          },
          "boundaries": [
            {
              "frame": 40,
              "from": 0,
              "to": 1
            },
            {
              "frame": 486,
              "from": 1,
              "to": 2
            },
            {
              "frame": 667,
              "from": 2,
              "to": 3
            }
          ]
        }
      ],
      "summary": {
        "early_switch_count": 0,
        "sequence_completion_rate": 0.75,
        "chunk_language_accuracy": 0.76171875,
        "frame_language_accuracy": 0.7460285614616118
      }
    }
  ]
}