Add Puff (Jigglypuff) checkpoint: mimic-xl (768d/6L/12h/SwiGLU) val 0.6766

Files changed (3)

puff/config.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
-  "d_model": 512,
-  "nhead": 8,
   "num_layers": 6,
-  "dim_feedforward": 2048,
-  "dropout": 0.2,
   "encoder_type": "mimic_flat",
   "d_intra": 256,
   "encoder_nlayers": 2,
@@ -17,7 +17,7 @@
   "attn_variant": "standard",
   "n_kv_heads": 0,
   "use_rmsnorm": false,
-  "use_swiglu": false,
   "stick_loss": "clusters",
   "btn_loss": "focal",
   "no_opp_inputs": true,
@@ -42,6 +42,6 @@
   "num_c_dirs": 9,
   "num_proj_types": 103,
   "num_proj_subtypes": 40,
-  "model_preset": "mimic",
-  "run_name": "puff-20260417-relpos"
 }

 {
+  "d_model": 768,
+  "nhead": 12,
   "num_layers": 6,
+  "dim_feedforward": 3072,
+  "dropout": 0.1,
   "encoder_type": "mimic_flat",
   "d_intra": 256,
   "encoder_nlayers": 2,
   "attn_variant": "standard",
   "n_kv_heads": 0,
   "use_rmsnorm": false,
+  "use_swiglu": true,
   "stick_loss": "clusters",
   "btn_loss": "focal",
   "no_opp_inputs": true,
   "num_c_dirs": 9,
   "num_proj_types": 103,
   "num_proj_subtypes": 40,
+  "model_preset": "mimic-xl",
+  "run_name": "puff-20260418-relpos-xl"
 }

puff/metadata.json CHANGED Viewed

@@ -1,16 +1,16 @@
 {
   "character": "Jigglypuff",
   "melee_enum": "JIGGLYPUFF",
-  "run_name": "puff-20260417-relpos",
-  "global_step": 32373,
-  "n_params": 26276389,
   "n_controller_combos": 7,
-  "model_preset": "mimic",
   "pos_enc": "relpos",
-  "val_loss": "0.6890",
-  "best_step": 32373,
-  "val_btn_f1": "91.3%",
-  "val_main_f1": "52.2%",
-  "val_shldr_f1": "91.7%",
-  "val_cdir_f1": "70.6%"
 }

 {
   "character": "Jigglypuff",
   "melee_enum": "JIGGLYPUFF",
+  "run_name": "puff-20260418-relpos-xl",
+  "global_step": 29757,
+  "games_trained": 33585,
+  "val_btn_f1": "91.3%",
+  "val_main_f1": "51.7%",
+  "val_loss": "0.6766",
+  "n_params": 50590757,
   "n_controller_combos": 7,
+  "model_preset": "mimic-xl",
   "pos_enc": "relpos",
+  "no_self_inputs": false,
+  "training_notes": "Trained 2026-04-18 on the full Puff HuggingFace set (33,327 .slp files \u2192 33,585 games after quality filters, 168 \u00d7 4GB shards). v2 shards, relpos attention, --self-inputs, 32,768 steps at eff_bs 512 in 83 min on 2\u00d7RTX 5090. Uses the `mimic-xl` preset: d_model=768, 6 layers, 12 heads, d_ff=3072, SwiGLU FFN, dropout 0.1 \u2014 ~50.6M params, roughly 1.9\u00d7 the size of the standard `mimic` preset (~26.3M params). Beat the matching standard-size puff baseline (val loss 0.6890) by 1.8% in val loss. Run qeka6rq8 would be the apples-to-apples reference run for capacity comparisons."
 }

puff/model.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:140439d5daac2a0294f614c8e650d0e41a42095bac342ce223792b6e9dc41e06
-size 265142047

 version https://git-lfs.github.com/spec/v1
+oid sha256:65fdc96b775bf0efd240fc76cc194fd4d8f3a8ec2a5e31f5cdc429a970ad2107
+size 556909050