Training in progress, step 4000, checkpoint
Browse files- last-checkpoint/config.json +1 -1
- last-checkpoint/global_step4000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step4000/mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/model.safetensors +1 -1
- last-checkpoint/rng_state.pth +2 -2
- last-checkpoint/scheduler.pt +2 -2
- last-checkpoint/tokenizer.json +0 -0
- last-checkpoint/trainer_state.json +0 -0
- last-checkpoint/training_args.bin +2 -2
- last-checkpoint/vocab.json +0 -0
last-checkpoint/config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "./
|
| 3 |
"activation_dropout": 0.0,
|
| 4 |
"activation_function": "gelu",
|
| 5 |
"apply_spec_augment": false,
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "./iteboshi_student_model",
|
| 3 |
"activation_dropout": 0.0,
|
| 4 |
"activation_function": "gelu",
|
| 5 |
"apply_spec_augment": false,
|
last-checkpoint/global_step4000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4925e56c9d2a00e9f473e8c7645b3d0a3a4e41097d4c8ce171f7a098a8a8abc3
|
| 3 |
+
size 5117197489
|
last-checkpoint/global_step4000/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:228d3b5d3dd5cdd6840987df23e85f2d1dbf381652d22076d85ffd17dc6cfe91
|
| 3 |
+
size 859127933
|
last-checkpoint/latest
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
|
|
|
|
| 1 |
+
global_step4000
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 962205216
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9783304ccc30a2ca3ef8ee2b6028590101d0883ace79912368fe45d258f448da
|
| 3 |
size 962205216
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1738051805633f2dae2cb76862a890f5315dec48d62792eb30d467b255aa9375
|
| 3 |
+
size 14709
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:39633b2dde2fc370ba24b3ba0a39e36a540c9e698e671d01c13867edb1102dc8
|
| 3 |
+
size 1465
|
last-checkpoint/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
last-checkpoint/trainer_state.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
last-checkpoint/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5cddc2dca74f30db07f7eb32e15dbc2c9754c5c53b06aa493b2582deab8dfd7f
|
| 3 |
+
size 7249
|
last-checkpoint/vocab.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|