final: baseline fixed1k + sampled synth (T=5, B=2000, lr=2e-05, gas=16)
Browse files- config.json +1 -1
- model-00001-of-00003.safetensors +2 -2
- model-00002-of-00003.safetensors +1 -1
- model-00003-of-00003.safetensors +1 -1
- model.safetensors.index.json +2 -2
config.json
CHANGED
|
@@ -39,5 +39,5 @@
|
|
| 39 |
"transformers_version": "4.57.3",
|
| 40 |
"type_vocab_size": 0,
|
| 41 |
"use_cache": false,
|
| 42 |
-
"vocab_size":
|
| 43 |
}
|
|
|
|
| 39 |
"transformers_version": "4.57.3",
|
| 40 |
"type_vocab_size": 0,
|
| 41 |
"use_cache": false,
|
| 42 |
+
"vocab_size": 128001
|
| 43 |
}
|
model-00001-of-00003.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a52010352accd4fe1bd12fae41ba72dddc9d6e0d2ad15d8fe4d813468203b36
|
| 3 |
+
size 393219224
|
model-00002-of-00003.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 198480360
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bbe64048d990a442da1c3f9541f7be90e9dd44bba6412d70319a6ef17c10c78a
|
| 3 |
size 198480360
|
model-00003-of-00003.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 145712228
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e93ee22ff8b9ae3883a2118c673e7512d8569d2aa3186f1310cce3842e3b1a5
|
| 3 |
size 145712228
|
model.safetensors.index.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
-
"total_parameters":
|
| 4 |
-
"total_size":
|
| 5 |
},
|
| 6 |
"weight_map": {
|
| 7 |
"classifier.bias": "model-00003-of-00003.safetensors",
|
|
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
+
"total_parameters": 184346881,
|
| 4 |
+
"total_size": 737387524
|
| 5 |
},
|
| 6 |
"weight_map": {
|
| 7 |
"classifier.bias": "model-00003-of-00003.safetensors",
|