Upload MIMIC character checkpoints + model card
Browse files- README.md +1 -4
- fox/config.json +10 -7
- fox/metadata.json +7 -7
- fox/model.pt +2 -2
README.md
CHANGED
|
@@ -34,10 +34,7 @@ outputs controller inputs (main stick, c-stick, shoulder, buttons) at 60 Hz.
|
|
| 34 |
|
| 35 |
| Character | Games | Val btn F1 | Val main F1 | Val loss | Step |
|
| 36 |
|---|---|---|---|---|---|
|
| 37 |
-
| **Fox** | 17,319 | 87.
|
| 38 |
-
| **Falco** | 9,110 | 88.2% | 58.5% | 0.68 | 28,122 |
|
| 39 |
-
| **Captain Falcon** | 9,404 | 89.9% | 52.2% | 0.71 | 26,814 |
|
| 40 |
-
| **Luigi** | 1,951 | ~91% | ~60% | ~1.0 | 5,242 |
|
| 41 |
|
| 42 |
## Repo layout
|
| 43 |
|
|
|
|
| 34 |
|
| 35 |
| Character | Games | Val btn F1 | Val main F1 | Val loss | Step |
|
| 36 |
|---|---|---|---|---|---|
|
| 37 |
+
| **Fox** | 17,319 | 87.1% | ~55% | 0.77 | 55,692 |
|
|
|
|
|
|
|
|
|
|
| 38 |
|
| 39 |
## Repo layout
|
| 40 |
|
fox/config.json
CHANGED
|
@@ -3,14 +3,14 @@
|
|
| 3 |
"nhead": 8,
|
| 4 |
"num_layers": 6,
|
| 5 |
"dim_feedforward": 2048,
|
| 6 |
-
"dropout": 0.
|
| 7 |
-
"encoder_type": "
|
| 8 |
"d_intra": 256,
|
| 9 |
"encoder_nlayers": 2,
|
| 10 |
"k_query": 1,
|
| 11 |
"scaled_emb": false,
|
| 12 |
"max_seq_len": 256,
|
| 13 |
-
"pos_enc": "
|
| 14 |
"rope_theta": 10000.0,
|
| 15 |
"rope_learnable_freqs": false,
|
| 16 |
"xpos_scale_base": 0.0,
|
|
@@ -26,11 +26,14 @@
|
|
| 26 |
"n_stick_clusters": 37,
|
| 27 |
"n_shoulder_bins": 3,
|
| 28 |
"autoregressive_heads": true,
|
| 29 |
-
"
|
| 30 |
"lean_features": false,
|
|
|
|
|
|
|
|
|
|
|
|
|
| 31 |
"hal_minimal_features": true,
|
| 32 |
"hal_controller_encoding": true,
|
| 33 |
-
"n_controller_combos": 7,
|
| 34 |
"num_stages": 6,
|
| 35 |
"num_ports": 4,
|
| 36 |
"num_characters": 27,
|
|
@@ -39,6 +42,6 @@
|
|
| 39 |
"num_c_dirs": 9,
|
| 40 |
"num_proj_types": 103,
|
| 41 |
"num_proj_subtypes": 40,
|
| 42 |
-
"model_preset": "
|
| 43 |
-
"run_name": "fox-
|
| 44 |
}
|
|
|
|
| 3 |
"nhead": 8,
|
| 4 |
"num_layers": 6,
|
| 5 |
"dim_feedforward": 2048,
|
| 6 |
+
"dropout": 0.2,
|
| 7 |
+
"encoder_type": "mimic_flat",
|
| 8 |
"d_intra": 256,
|
| 9 |
"encoder_nlayers": 2,
|
| 10 |
"k_query": 1,
|
| 11 |
"scaled_emb": false,
|
| 12 |
"max_seq_len": 256,
|
| 13 |
+
"pos_enc": "relpos",
|
| 14 |
"rope_theta": 10000.0,
|
| 15 |
"rope_learnable_freqs": false,
|
| 16 |
"xpos_scale_base": 0.0,
|
|
|
|
| 26 |
"n_stick_clusters": 37,
|
| 27 |
"n_shoulder_bins": 3,
|
| 28 |
"autoregressive_heads": true,
|
| 29 |
+
"mimic_mode": true,
|
| 30 |
"lean_features": false,
|
| 31 |
+
"mimic_minimal_features": true,
|
| 32 |
+
"mimic_controller_encoding": true,
|
| 33 |
+
"n_controller_combos": 7,
|
| 34 |
+
"hal_mode": true,
|
| 35 |
"hal_minimal_features": true,
|
| 36 |
"hal_controller_encoding": true,
|
|
|
|
| 37 |
"num_stages": 6,
|
| 38 |
"num_ports": 4,
|
| 39 |
"num_characters": 27,
|
|
|
|
| 42 |
"num_c_dirs": 9,
|
| 43 |
"num_proj_types": 103,
|
| 44 |
"num_proj_subtypes": 40,
|
| 45 |
+
"model_preset": "mimic",
|
| 46 |
+
"run_name": "fox-20260414-relpos"
|
| 47 |
}
|
fox/metadata.json
CHANGED
|
@@ -1,16 +1,16 @@
|
|
| 1 |
{
|
| 2 |
"character": "Fox",
|
| 3 |
"melee_enum": "FOX",
|
| 4 |
-
"run_name": "fox-
|
| 5 |
-
"global_step":
|
| 6 |
"games_trained": 17319,
|
| 7 |
-
"val_btn_f1": "87.
|
| 8 |
"val_main_f1": "~55%",
|
| 9 |
"val_loss": "0.77",
|
| 10 |
-
"n_params":
|
| 11 |
"n_controller_combos": 7,
|
| 12 |
-
"model_preset": "
|
| 13 |
-
"pos_enc": "
|
| 14 |
"no_self_inputs": false,
|
| 15 |
-
"training_notes": "Trained 2026-04-
|
| 16 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"character": "Fox",
|
| 3 |
"melee_enum": "FOX",
|
| 4 |
+
"run_name": "fox-20260414-relpos",
|
| 5 |
+
"global_step": 55692,
|
| 6 |
"games_trained": 17319,
|
| 7 |
+
"val_btn_f1": "87.1%",
|
| 8 |
"val_main_f1": "~55%",
|
| 9 |
"val_loss": "0.77",
|
| 10 |
+
"n_params": 26276389,
|
| 11 |
"n_controller_combos": 7,
|
| 12 |
+
"model_preset": "mimic",
|
| 13 |
+
"pos_enc": "relpos",
|
| 14 |
"no_self_inputs": false,
|
| 15 |
+
"training_notes": "Trained 2026-04-14, fox-20260414-relpos run. v2 shards, Shaw relative-position attention (mimic preset), --self-inputs, dropout 0.2, 65K steps at batch 512 (2x the standard schedule). Replaces yesterday's RoPE Fox, which matched this run on val metrics, but relpos won the 2026-04-14 sweep on Falco, so we standardized on it for all new runs. Best checkpoint is the step 55692 snapshot, closest to the lowest measured val loss."
|
| 16 |
}
|
fox/model.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03c11167493e4dbf11c8871135e82194714edde9ca522fd656cd008e9e74436d
|
| 3 |
+
size 265142496
|