Upload 3 files
Browse files
- model.safetensors +1 -1
- optimizer.pt +1 -1
- training_state.json +3 -3
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 549501112
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3fad293a94f2815270a7e0c524f7048031bb65cf2b3062cbb727b3da2d4d4aa9
|
| 3 |
size 549501112
|
optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1099075450
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f76dd2ea2642a355e77a15fe5d685453fb825348924df8d46ed6aeee32fb238
|
| 3 |
size 1099075450
|
training_state.json
CHANGED
|
@@ -1,11 +1,11 @@
|
|
| 1 |
{
|
| 2 |
-
"step":
|
| 3 |
-
"epoch":
|
| 4 |
"vocab_size": 30574,
|
| 5 |
"model_vocab_size": 30592,
|
| 6 |
"config": {
|
| 7 |
"optimizer_type": "adamw",
|
| 8 |
-
"lr":
|
| 9 |
"weight_decay": 0.01,
|
| 10 |
"warmup_steps": 8000,
|
| 11 |
"scheduler_type": "cosine",
|
|
|
|
| 1 |
{
|
| 2 |
+
"step": 1050000,
|
| 3 |
+
"epoch": 27,
|
| 4 |
"vocab_size": 30574,
|
| 5 |
"model_vocab_size": 30592,
|
| 6 |
"config": {
|
| 7 |
"optimizer_type": "adamw",
|
| 8 |
+
"lr": 0.0001,
|
| 9 |
"weight_decay": 0.01,
|
| 10 |
"warmup_steps": 8000,
|
| 11 |
"scheduler_type": "cosine",
|