erickfm committed on
Commit
39e2386
·
verified ·
1 Parent(s): b7a8aec

Update puff checkpoint + metadata

Browse files
Files changed (3) hide show
  1. puff/config.json +10 -9
  2. puff/metadata.json +10 -10
  3. puff/model.pt +2 -2
puff/config.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "d_model": 768,
3
- "nhead": 12,
4
- "num_layers": 6,
5
- "dim_feedforward": 3072,
6
  "dropout": 0.1,
7
  "encoder_type": "mimic_flat",
8
  "d_intra": 256,
@@ -17,7 +17,8 @@
17
  "attn_variant": "standard",
18
  "n_kv_heads": 0,
19
  "use_rmsnorm": false,
20
- "use_swiglu": true,
 
21
  "stick_loss": "clusters",
22
  "btn_loss": "focal",
23
  "no_opp_inputs": true,
@@ -28,11 +29,11 @@
28
  "autoregressive_heads": true,
29
  "mimic_mode": true,
30
  "lean_features": false,
31
- "mimic_minimal_features": true,
32
  "mimic_controller_encoding": true,
33
  "n_controller_combos": 7,
34
  "hal_mode": true,
35
- "hal_minimal_features": true,
36
  "hal_controller_encoding": true,
37
  "num_stages": 6,
38
  "num_ports": 4,
@@ -42,6 +43,6 @@
42
  "num_c_dirs": 9,
43
  "num_proj_types": 103,
44
  "num_proj_subtypes": 40,
45
- "model_preset": "mimic-xl",
46
- "run_name": "puff-20260418-relpos-xl"
47
  }
 
1
  {
2
+ "d_model": 1024,
3
+ "nhead": 16,
4
+ "num_layers": 12,
5
+ "dim_feedforward": 4096,
6
  "dropout": 0.1,
7
  "encoder_type": "mimic_flat",
8
  "d_intra": 256,
 
17
  "attn_variant": "standard",
18
  "n_kv_heads": 0,
19
  "use_rmsnorm": false,
20
+ "use_swiglu": false,
21
+ "use_input_gate": false,
22
  "stick_loss": "clusters",
23
  "btn_loss": "focal",
24
  "no_opp_inputs": true,
 
29
  "autoregressive_heads": true,
30
  "mimic_mode": true,
31
  "lean_features": false,
32
+ "mimic_minimal_features": false,
33
  "mimic_controller_encoding": true,
34
  "n_controller_combos": 7,
35
  "hal_mode": true,
36
+ "hal_minimal_features": false,
37
  "hal_controller_encoding": true,
38
  "num_stages": 6,
39
  "num_ports": 4,
 
43
  "num_c_dirs": 9,
44
  "num_proj_types": 103,
45
  "num_proj_subtypes": 40,
46
+ "model_preset": "mimic-xxl",
47
+ "run_name": "puff-20260419-mimic-xxl"
48
  }
puff/metadata.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
  "character": "Jigglypuff",
3
  "melee_enum": "JIGGLYPUFF",
4
- "run_name": "puff-20260418-relpos-xl",
5
- "global_step": 29757,
6
- "games_trained": 33585,
7
- "val_btn_f1": "91.3%",
8
- "val_main_f1": "51.7%",
9
- "val_loss": "0.6766",
10
- "n_params": 50590757,
11
  "n_controller_combos": 7,
12
- "model_preset": "mimic-xl",
13
  "pos_enc": "relpos",
14
- "no_self_inputs": false,
15
- "training_notes": "Trained 2026-04-18 on the full Puff HuggingFace set (33,327 .slp files \u2192 33,585 games after quality filters, 168 \u00d7 4GB shards). v2 shards, relpos attention, --self-inputs, 32,768 steps at eff_bs 512 in 83 min on 2\u00d7RTX 5090. Uses the `mimic-xl` preset: d_model=768, 6 layers, 12 heads, d_ff=3072, SwiGLU FFN, dropout 0.1 \u2014 ~44M params, a 2.2\u00d7 scaled-up variant of the standard `mimic` preset. Beat the matching standard-size puff baseline (val 0.6890) by 1.8% (run qeka6rq8 would be an apples-to-apples reference run for capacity comparisons)."
 
 
 
 
16
  }
 
1
  {
2
  "character": "Jigglypuff",
3
  "melee_enum": "JIGGLYPUFF",
4
+ "run_name": "puff-20260419-mimic-xxl",
5
+ "global_step": 30738,
6
+ "n_params": 166949413,
 
 
 
 
7
  "n_controller_combos": 7,
8
+ "model_preset": "mimic-xxl",
9
  "pos_enc": "relpos",
10
+ "val_loss": "0.6432",
11
+ "best_step": 30738,
12
+ "val_btn_f1": "91.4%",
13
+ "val_main_f1": "53.3%",
14
+ "val_shldr_f1": "91.0%",
15
+ "val_cdir_f1": "68.7%"
16
  }
puff/model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65fdc96b775bf0efd240fc76cc194fd4d8f3a8ec2a5e31f5cdc429a970ad2107
3
- size 556909050
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0bcad2e1f0250c07a4574aa346e73556d30c71306a1ff76563e45c21ba920ad
3
+ size 1902993716