Update falco checkpoint + metadata
Browse files
- falco/config.json +10 -9
- falco/metadata.json +10 -10
- falco/model.pt +2 -2
falco/config.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
-
"d_model":
|
| 3 |
-
"nhead":
|
| 4 |
-
"num_layers":
|
| 5 |
-
"dim_feedforward":
|
| 6 |
-
"dropout": 0.
|
| 7 |
"encoder_type": "mimic_flat",
|
| 8 |
"d_intra": 256,
|
| 9 |
"encoder_nlayers": 2,
|
|
@@ -18,6 +18,7 @@
|
|
| 18 |
"n_kv_heads": 0,
|
| 19 |
"use_rmsnorm": false,
|
| 20 |
"use_swiglu": false,
|
|
|
|
| 21 |
"stick_loss": "clusters",
|
| 22 |
"btn_loss": "focal",
|
| 23 |
"no_opp_inputs": true,
|
|
@@ -28,11 +29,11 @@
|
|
| 28 |
"autoregressive_heads": true,
|
| 29 |
"mimic_mode": true,
|
| 30 |
"lean_features": false,
|
| 31 |
-
"mimic_minimal_features":
|
| 32 |
"mimic_controller_encoding": true,
|
| 33 |
"n_controller_combos": 7,
|
| 34 |
"hal_mode": true,
|
| 35 |
-
"hal_minimal_features":
|
| 36 |
"hal_controller_encoding": true,
|
| 37 |
"num_stages": 6,
|
| 38 |
"num_ports": 4,
|
|
@@ -42,6 +43,6 @@
|
|
| 42 |
"num_c_dirs": 9,
|
| 43 |
"num_proj_types": 103,
|
| 44 |
"num_proj_subtypes": 40,
|
| 45 |
-
"model_preset": "mimic",
|
| 46 |
-
"run_name": "falco-
|
| 47 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"d_model": 1024,
|
| 3 |
+
"nhead": 16,
|
| 4 |
+
"num_layers": 12,
|
| 5 |
+
"dim_feedforward": 4096,
|
| 6 |
+
"dropout": 0.1,
|
| 7 |
"encoder_type": "mimic_flat",
|
| 8 |
"d_intra": 256,
|
| 9 |
"encoder_nlayers": 2,
|
|
|
|
| 18 |
"n_kv_heads": 0,
|
| 19 |
"use_rmsnorm": false,
|
| 20 |
"use_swiglu": false,
|
| 21 |
+
"use_input_gate": false,
|
| 22 |
"stick_loss": "clusters",
|
| 23 |
"btn_loss": "focal",
|
| 24 |
"no_opp_inputs": true,
|
|
|
|
| 29 |
"autoregressive_heads": true,
|
| 30 |
"mimic_mode": true,
|
| 31 |
"lean_features": false,
|
| 32 |
+
"mimic_minimal_features": false,
|
| 33 |
"mimic_controller_encoding": true,
|
| 34 |
"n_controller_combos": 7,
|
| 35 |
"hal_mode": true,
|
| 36 |
+
"hal_minimal_features": false,
|
| 37 |
"hal_controller_encoding": true,
|
| 38 |
"num_stages": 6,
|
| 39 |
"num_ports": 4,
|
|
|
|
| 43 |
"num_c_dirs": 9,
|
| 44 |
"num_proj_types": 103,
|
| 45 |
"num_proj_subtypes": 40,
|
| 46 |
+
"model_preset": "mimic-xxl",
|
| 47 |
+
"run_name": "falco-20260419-xxl"
|
| 48 |
}
|
falco/metadata.json
CHANGED
|
@@ -1,16 +1,16 @@
|
|
| 1 |
{
|
| 2 |
"character": "Falco",
|
| 3 |
"melee_enum": "FALCO",
|
| 4 |
-
"run_name": "falco-
|
| 5 |
-
"global_step":
|
| 6 |
-
"n_params":
|
| 7 |
"n_controller_combos": 7,
|
| 8 |
-
"model_preset": "mimic",
|
| 9 |
"pos_enc": "relpos",
|
| 10 |
-
"val_loss": "
|
| 11 |
-
"best_step":
|
| 12 |
-
"val_btn_f1": "88.
|
| 13 |
-
"val_main_f1": "
|
| 14 |
-
"val_shldr_f1": "
|
| 15 |
-
"val_cdir_f1": "
|
| 16 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"character": "Falco",
|
| 3 |
"melee_enum": "FALCO",
|
| 4 |
+
"run_name": "falco-20260419-xxl",
|
| 5 |
+
"global_step": 7521,
|
| 6 |
+
"n_params": 166949413,
|
| 7 |
"n_controller_combos": 7,
|
| 8 |
+
"model_preset": "mimic-xxl",
|
| 9 |
"pos_enc": "relpos",
|
| 10 |
+
"val_loss": "?",
|
| 11 |
+
"best_step": null,
|
| 12 |
+
"val_btn_f1": "88.1%",
|
| 13 |
+
"val_main_f1": "55.9%",
|
| 14 |
+
"val_shldr_f1": "86.2%",
|
| 15 |
+
"val_cdir_f1": "59.9%"
|
| 16 |
}
|
falco/model.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7dee47df65c356a63139ab7206d2fed035bd3154880bb2839b58e563ba9826f6
|
| 3 |
+
size 1902989881
|