Upload MIMIC character checkpoints + model card

Files changed (4)

README.md CHANGED Viewed

@@ -34,7 +34,7 @@ outputs controller inputs (main stick, c-stick, shoulder, buttons) at 60 Hz.
 | Character | Games | Val btn F1 | Val main F1 | Val loss | Step |
 |---|---|---|---|---|---|
-| **Fox** | 17,319 | ~59% | ~15% | 2.27 | 28,165 |
 | **Falco** | 9,110 | 88.2% | 58.5% | 0.68 | 28,122 |
 | **Captain Falcon** | 9,404 | 89.9% | 52.2% | 0.71 | 26,814 |
 | **Luigi** | 1,951 | ~91% | ~60% | ~1.0 | 5,242 |

 | Character | Games | Val btn F1 | Val main F1 | Val loss | Step |
 |---|---|---|---|---|---|
+| **Fox** | 17,319 | 87.7% | ~55% | 0.77 | 31,065 |
 | **Falco** | 9,110 | 88.2% | 58.5% | 0.68 | 28,122 |
 | **Captain Falcon** | 9,404 | 89.9% | 52.2% | 0.71 | 26,814 |
 | **Luigi** | 1,951 | ~91% | ~60% | ~1.0 | 5,242 |

fox/config.json CHANGED Viewed

@@ -3,14 +3,14 @@
   "nhead": 8,
   "num_layers": 6,
   "dim_feedforward": 2048,
-  "dropout": 0.2,
   "encoder_type": "hal_flat",
   "d_intra": 256,
   "encoder_nlayers": 2,
   "k_query": 1,
   "scaled_emb": false,
   "max_seq_len": 256,
-  "pos_enc": "relpos",
   "rope_theta": 10000.0,
   "rope_learnable_freqs": false,
   "xpos_scale_base": 0.0,
@@ -21,7 +21,7 @@
   "stick_loss": "clusters",
   "btn_loss": "focal",
   "no_opp_inputs": true,
-  "no_self_inputs": true,
   "head_hidden": 256,
   "n_stick_clusters": 37,
   "n_shoulder_bins": 3,
@@ -39,6 +39,6 @@
   "num_c_dirs": 9,
   "num_proj_types": 103,
   "num_proj_subtypes": 40,
-  "model_preset": "hal",
-  "run_name": "hal-7class-v2-long"
 }

   "nhead": 8,
   "num_layers": 6,
   "dim_feedforward": 2048,
+  "dropout": 0.1,
   "encoder_type": "hal_flat",
   "d_intra": 256,
   "encoder_nlayers": 2,
   "k_query": 1,
   "scaled_emb": false,
   "max_seq_len": 256,
+  "pos_enc": "rope",
   "rope_theta": 10000.0,
   "rope_learnable_freqs": false,
   "xpos_scale_base": 0.0,
   "stick_loss": "clusters",
   "btn_loss": "focal",
   "no_opp_inputs": true,
+  "no_self_inputs": false,
   "head_hidden": 256,
   "n_stick_clusters": 37,
   "n_shoulder_bins": 3,
   "num_c_dirs": 9,
   "num_proj_types": 103,
   "num_proj_subtypes": 40,
+  "model_preset": "hal-rope",
+  "run_name": "fox-rope-v2"
 }

fox/metadata.json CHANGED Viewed

@@ -1,16 +1,16 @@
 {
   "character": "Fox",
   "melee_enum": "FOX",
-  "run_name": "hal-7class-v2-long",
-  "global_step": 28165,
   "games_trained": 17319,
-  "val_btn_f1": "~59%",
-  "val_main_f1": "~15%",
-  "val_loss": "2.27",
-  "n_params": 26247717,
   "n_controller_combos": 7,
-  "model_preset": "hal",
-  "pos_enc": "relpos",
-  "no_self_inputs": true,
-  "training_notes": "Legacy checkpoint from the 2026-04-11 hal-7class-v2-long run. Trained WITHOUT --self-inputs, which is why the val metrics look much lower than the other characters. Still plays actively in Dolphin but performance is below the Falco/CptFalcon/Luigi models. A new Fox run with --self-inputs is a todo."
 }

 {
   "character": "Fox",
   "melee_enum": "FOX",
+  "run_name": "fox-rope-v2",
+  "global_step": 31065,
   "games_trained": 17319,
+  "val_btn_f1": "87.7%",
+  "val_main_f1": "~55%",
+  "val_loss": "0.77",
+  "n_params": 19591909,
   "n_controller_combos": 7,
+  "model_preset": "hal-rope",
+  "pos_enc": "rope",
+  "no_self_inputs": false,
+  "training_notes": "Trained 2026-04-13, fox-rope-v2 run. v2 shards, RoPE position encoding (hal-rope preset), --self-inputs, dropout 0.1, 32K steps at batch 512. Replaces the legacy hal-7class-v2-long checkpoint which was trained without --self-inputs and stuck at val loss 2.27. The self-inputs flag was the real fix \u2014 RoPE vs relpos is secondary. Metrics land alongside Falco/CptFalcon/Luigi."
 }

fox/model.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b7bcb0d0b3d4a0cddcf18887cc9deee36a2910cafa5fca4b0a360cae68f04c20
-size 264795225

 version https://git-lfs.github.com/spec/v1
+oid sha256:41ee9f42c3f5c8d03dfe799e2e8b08a142a88fe3328e295e99ebcf855162def0
+size 235274570