erickfm committed on
Commit
f5d1cd7
·
verified ·
1 Parent(s): 97ccaa3

Upload MIMIC character checkpoints + model card

Browse files
Files changed (4) hide show
  1. README.md +1 -4
  2. fox/config.json +10 -7
  3. fox/metadata.json +7 -7
  4. fox/model.pt +2 -2
README.md CHANGED
@@ -34,10 +34,7 @@ outputs controller inputs (main stick, c-stick, shoulder, buttons) at 60 Hz.
34
 
35
  | Character | Games | Val btn F1 | Val main F1 | Val loss | Step |
36
  |---|---|---|---|---|---|
37
- | **Fox** | 17,319 | 87.7% | ~55% | 0.77 | 31,065 |
38
- | **Falco** | 9,110 | 88.2% | 58.5% | 0.68 | 28,122 |
39
- | **Captain Falcon** | 9,404 | 89.9% | 52.2% | 0.71 | 26,814 |
40
- | **Luigi** | 1,951 | ~91% | ~60% | ~1.0 | 5,242 |
41
 
42
  ## Repo layout
43
 
 
34
 
35
  | Character | Games | Val btn F1 | Val main F1 | Val loss | Step |
36
  |---|---|---|---|---|---|
37
+ | **Fox** | 17,319 | 87.1% | ~55% | 0.77 | 55,692 |
 
 
 
38
 
39
  ## Repo layout
40
 
fox/config.json CHANGED
@@ -3,14 +3,14 @@
3
  "nhead": 8,
4
  "num_layers": 6,
5
  "dim_feedforward": 2048,
6
- "dropout": 0.1,
7
- "encoder_type": "hal_flat",
8
  "d_intra": 256,
9
  "encoder_nlayers": 2,
10
  "k_query": 1,
11
  "scaled_emb": false,
12
  "max_seq_len": 256,
13
- "pos_enc": "rope",
14
  "rope_theta": 10000.0,
15
  "rope_learnable_freqs": false,
16
  "xpos_scale_base": 0.0,
@@ -26,11 +26,14 @@
26
  "n_stick_clusters": 37,
27
  "n_shoulder_bins": 3,
28
  "autoregressive_heads": true,
29
- "hal_mode": true,
30
  "lean_features": false,
 
 
 
 
31
  "hal_minimal_features": true,
32
  "hal_controller_encoding": true,
33
- "n_controller_combos": 7,
34
  "num_stages": 6,
35
  "num_ports": 4,
36
  "num_characters": 27,
@@ -39,6 +42,6 @@
39
  "num_c_dirs": 9,
40
  "num_proj_types": 103,
41
  "num_proj_subtypes": 40,
42
- "model_preset": "hal-rope",
43
- "run_name": "fox-rope-v2"
44
  }
 
3
  "nhead": 8,
4
  "num_layers": 6,
5
  "dim_feedforward": 2048,
6
+ "dropout": 0.2,
7
+ "encoder_type": "mimic_flat",
8
  "d_intra": 256,
9
  "encoder_nlayers": 2,
10
  "k_query": 1,
11
  "scaled_emb": false,
12
  "max_seq_len": 256,
13
+ "pos_enc": "relpos",
14
  "rope_theta": 10000.0,
15
  "rope_learnable_freqs": false,
16
  "xpos_scale_base": 0.0,
 
26
  "n_stick_clusters": 37,
27
  "n_shoulder_bins": 3,
28
  "autoregressive_heads": true,
29
+ "mimic_mode": true,
30
  "lean_features": false,
31
+ "mimic_minimal_features": true,
32
+ "mimic_controller_encoding": true,
33
+ "n_controller_combos": 7,
34
+ "hal_mode": true,
35
  "hal_minimal_features": true,
36
  "hal_controller_encoding": true,
 
37
  "num_stages": 6,
38
  "num_ports": 4,
39
  "num_characters": 27,
 
42
  "num_c_dirs": 9,
43
  "num_proj_types": 103,
44
  "num_proj_subtypes": 40,
45
+ "model_preset": "mimic",
46
+ "run_name": "fox-20260414-relpos"
47
  }
fox/metadata.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
  "character": "Fox",
3
  "melee_enum": "FOX",
4
- "run_name": "fox-rope-v2",
5
- "global_step": 31065,
6
  "games_trained": 17319,
7
- "val_btn_f1": "87.7%",
8
  "val_main_f1": "~55%",
9
  "val_loss": "0.77",
10
- "n_params": 19591909,
11
  "n_controller_combos": 7,
12
- "model_preset": "hal-rope",
13
- "pos_enc": "rope",
14
  "no_self_inputs": false,
15
- "training_notes": "Trained 2026-04-13, fox-rope-v2 run. v2 shards, RoPE position encoding (hal-rope preset), --self-inputs, dropout 0.1, 32K steps at batch 512. Replaces the legacy hal-7class-v2-long checkpoint which was trained without --self-inputs and stuck at val loss 2.27. The self-inputs flag was the real fix \u2014 RoPE vs relpos is secondary. Metrics land alongside Falco/CptFalcon/Luigi."
16
  }
 
1
  {
2
  "character": "Fox",
3
  "melee_enum": "FOX",
4
+ "run_name": "fox-20260414-relpos",
5
+ "global_step": 55692,
6
  "games_trained": 17319,
7
+ "val_btn_f1": "87.1%",
8
  "val_main_f1": "~55%",
9
  "val_loss": "0.77",
10
+ "n_params": 26276389,
11
  "n_controller_combos": 7,
12
+ "model_preset": "mimic",
13
+ "pos_enc": "relpos",
14
  "no_self_inputs": false,
15
+ "training_notes": "Trained 2026-04-14, fox-20260414-relpos run. v2 shards, Shaw relative-position attention (mimic preset), --self-inputs, dropout 0.2, 65K steps at batch 512 (2x the standard schedule). Replaces yesterday's RoPE Fox, which matched this run on val metrics; relpos won the 2026-04-14 sweep on Falco, so we standardized on it for all new runs. Best checkpoint is the step 55692 snapshot, closest to the lowest measured val loss."
16
  }
fox/model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41ee9f42c3f5c8d03dfe799e2e8b08a142a88fe3328e295e99ebcf855162def0
3
- size 235274570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03c11167493e4dbf11c8871135e82194714edde9ca522fd656cd008e9e74436d
3
+ size 265142496