Upload trainer_0/config.json with huggingface_hub
Browse files- trainer_0/config.json +2 -2
trainer_0/config.json
CHANGED
|
@@ -10,7 +10,7 @@
|
|
| 10 |
"threshold_beta": 0.999,
|
| 11 |
"threshold_start_step": 1000,
|
| 12 |
"seed": null,
|
| 13 |
-
"activation_dim":
|
| 14 |
"dict_size": 16384,
|
| 15 |
"k": 128,
|
| 16 |
"device": "cuda:0",
|
|
@@ -20,7 +20,7 @@
|
|
| 20 |
"submodule_name": null
|
| 21 |
},
|
| 22 |
"buffer": {
|
| 23 |
-
"n_models":
|
| 24 |
"d_submodule": 512,
|
| 25 |
"io": "out",
|
| 26 |
"n_ctxs": 512,
|
|
|
|
| 10 |
"threshold_beta": 0.999,
|
| 11 |
"threshold_start_step": 1000,
|
| 12 |
"seed": null,
|
| 13 |
+
"activation_dim": 6144,
|
| 14 |
"dict_size": 16384,
|
| 15 |
"k": 128,
|
| 16 |
"device": "cuda:0",
|
|
|
|
| 20 |
"submodule_name": null
|
| 21 |
},
|
| 22 |
"buffer": {
|
| 23 |
+
"n_models": 12,
|
| 24 |
"d_submodule": 512,
|
| 25 |
"io": "out",
|
| 26 |
"n_ctxs": 512,
|