erickfm committed on
Commit
155d0fe
·
verified ·
1 Parent(s): a30bee7

Upload MIMIC character checkpoints + model card

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. fox/config.json +5 -5
  3. fox/metadata.json +10 -10
  4. fox/model.pt +2 -2
README.md CHANGED
@@ -34,7 +34,7 @@ outputs controller inputs (main stick, c-stick, shoulder, buttons) at 60 Hz.
34
 
35
  | Character | Games | Val btn F1 | Val main F1 | Val loss | Step |
36
  |---|---|---|---|---|---|
37
- | **Fox** | 17,319 | ~59% | ~15% | 2.27 | 28,165 |
38
  | **Falco** | 9,110 | 88.2% | 58.5% | 0.68 | 28,122 |
39
  | **Captain Falcon** | 9,404 | 89.9% | 52.2% | 0.71 | 26,814 |
40
  | **Luigi** | 1,951 | ~91% | ~60% | ~1.0 | 5,242 |
 
34
 
35
  | Character | Games | Val btn F1 | Val main F1 | Val loss | Step |
36
  |---|---|---|---|---|---|
37
+ | **Fox** | 17,319 | 87.7% | ~55% | 0.77 | 31,065 |
38
  | **Falco** | 9,110 | 88.2% | 58.5% | 0.68 | 28,122 |
39
  | **Captain Falcon** | 9,404 | 89.9% | 52.2% | 0.71 | 26,814 |
40
  | **Luigi** | 1,951 | ~91% | ~60% | ~1.0 | 5,242 |
fox/config.json CHANGED
@@ -3,14 +3,14 @@
3
  "nhead": 8,
4
  "num_layers": 6,
5
  "dim_feedforward": 2048,
6
- "dropout": 0.2,
7
  "encoder_type": "hal_flat",
8
  "d_intra": 256,
9
  "encoder_nlayers": 2,
10
  "k_query": 1,
11
  "scaled_emb": false,
12
  "max_seq_len": 256,
13
- "pos_enc": "relpos",
14
  "rope_theta": 10000.0,
15
  "rope_learnable_freqs": false,
16
  "xpos_scale_base": 0.0,
@@ -21,7 +21,7 @@
21
  "stick_loss": "clusters",
22
  "btn_loss": "focal",
23
  "no_opp_inputs": true,
24
- "no_self_inputs": true,
25
  "head_hidden": 256,
26
  "n_stick_clusters": 37,
27
  "n_shoulder_bins": 3,
@@ -39,6 +39,6 @@
39
  "num_c_dirs": 9,
40
  "num_proj_types": 103,
41
  "num_proj_subtypes": 40,
42
- "model_preset": "hal",
43
- "run_name": "hal-7class-v2-long"
44
  }
 
3
  "nhead": 8,
4
  "num_layers": 6,
5
  "dim_feedforward": 2048,
6
+ "dropout": 0.1,
7
  "encoder_type": "hal_flat",
8
  "d_intra": 256,
9
  "encoder_nlayers": 2,
10
  "k_query": 1,
11
  "scaled_emb": false,
12
  "max_seq_len": 256,
13
+ "pos_enc": "rope",
14
  "rope_theta": 10000.0,
15
  "rope_learnable_freqs": false,
16
  "xpos_scale_base": 0.0,
 
21
  "stick_loss": "clusters",
22
  "btn_loss": "focal",
23
  "no_opp_inputs": true,
24
+ "no_self_inputs": false,
25
  "head_hidden": 256,
26
  "n_stick_clusters": 37,
27
  "n_shoulder_bins": 3,
 
39
  "num_c_dirs": 9,
40
  "num_proj_types": 103,
41
  "num_proj_subtypes": 40,
42
+ "model_preset": "hal-rope",
43
+ "run_name": "fox-rope-v2"
44
  }
fox/metadata.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
  "character": "Fox",
3
  "melee_enum": "FOX",
4
- "run_name": "hal-7class-v2-long",
5
- "global_step": 28165,
6
  "games_trained": 17319,
7
- "val_btn_f1": "~59%",
8
- "val_main_f1": "~15%",
9
- "val_loss": "2.27",
10
- "n_params": 26247717,
11
  "n_controller_combos": 7,
12
- "model_preset": "hal",
13
- "pos_enc": "relpos",
14
- "no_self_inputs": true,
15
- "training_notes": "Legacy checkpoint from the 2026-04-11 hal-7class-v2-long run. Trained WITHOUT --self-inputs, which is why the val metrics look much lower than the other characters. Still plays actively in Dolphin but performance is below the Falco/CptFalcon/Luigi models. A new Fox run with --self-inputs is a todo."
16
  }
 
1
  {
2
  "character": "Fox",
3
  "melee_enum": "FOX",
4
+ "run_name": "fox-rope-v2",
5
+ "global_step": 31065,
6
  "games_trained": 17319,
7
+ "val_btn_f1": "87.7%",
8
+ "val_main_f1": "~55%",
9
+ "val_loss": "0.77",
10
+ "n_params": 19591909,
11
  "n_controller_combos": 7,
12
+ "model_preset": "hal-rope",
13
+ "pos_enc": "rope",
14
+ "no_self_inputs": false,
15
+ "training_notes": "Trained 2026-04-13, fox-rope-v2 run. v2 shards, RoPE position encoding (hal-rope preset), --self-inputs, dropout 0.1, 32K steps at batch 512 (this checkpoint is from step 31,065). Replaces the legacy hal-7class-v2-long checkpoint, which was trained without --self-inputs and was stuck at val loss 2.27. The self-inputs flag was the real fix \u2014 RoPE vs relpos is secondary. Metrics are now in line with the Falco/CptFalcon/Luigi models."
16
  }
fox/model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7bcb0d0b3d4a0cddcf18887cc9deee36a2910cafa5fca4b0a360cae68f04c20
3
- size 264795225
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41ee9f42c3f5c8d03dfe799e2e8b08a142a88fe3328e295e99ebcf855162def0
3
+ size 235274570