kiritan committed on
Commit
d7879fb
·
verified ·
1 Parent(s): 4c84a39

Training in progress, step 4000, checkpoint

Browse files
last-checkpoint/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "./iteboshi",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
 
1
  {
2
+ "_name_or_path": "./iteboshi_student_model",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
last-checkpoint/global_step4000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4925e56c9d2a00e9f473e8c7645b3d0a3a4e41097d4c8ce171f7a098a8a8abc3
3
+ size 5117197489
last-checkpoint/global_step4000/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:228d3b5d3dd5cdd6840987df23e85f2d1dbf381652d22076d85ffd17dc6cfe91
3
+ size 859127933
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step20000
 
1
+ global_step4000
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:069fbc2b96ff55558de2b6621d0406b4fbcbc7edffe8d2472bb8b992e0abdb14
3
  size 962205216
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9783304ccc30a2ca3ef8ee2b6028590101d0883ace79912368fe45d258f448da
3
  size 962205216
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef2e75134b208d60f6f9b30cef29e49813797dfcda4ce7d7e2cabca76bb3fa47
3
- size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1738051805633f2dae2cb76862a890f5315dec48d62792eb30d467b255aa9375
3
+ size 14709
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29c7a79b53a589de48d3b7a21df9c0d024be4dea79f68869f72fdc01ae3b212a
3
- size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39633b2dde2fc370ba24b3ba0a39e36a540c9e698e671d01c13867edb1102dc8
3
+ size 1465
last-checkpoint/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
last-checkpoint/trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff
 
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:141b47c9f24722722f87d8aaea6f79b4802e8fd4d3cc397deb797bdcbf425c80
3
- size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cddc2dca74f30db07f7eb32e15dbc2c9754c5c53b06aa493b2582deab8dfd7f
3
+ size 7249
last-checkpoint/vocab.json CHANGED
The diff for this file is too large to render. See raw diff