Training in progress, step 300, checkpoint
Browse files- checkpoint-300/adapter_config.json +4 -4
- checkpoint-300/adapter_model.safetensors +1 -1
- checkpoint-300/global_step300/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +1 -1
- checkpoint-300/global_step300/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +1 -1
- checkpoint-300/global_step300/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +1 -1
- checkpoint-300/global_step300/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +1 -1
- checkpoint-300/global_step300/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +1 -1
- checkpoint-300/global_step300/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +1 -1
- checkpoint-300/global_step300/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +1 -1
- checkpoint-300/global_step300/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +1 -1
- checkpoint-300/global_step300/mp_rank_00_model_states.pt +1 -1
- checkpoint-300/rng_state_0.pth +2 -2
- checkpoint-300/rng_state_1.pth +2 -2
- checkpoint-300/rng_state_2.pth +1 -1
- checkpoint-300/rng_state_3.pth +1 -1
- checkpoint-300/rng_state_4.pth +2 -2
- checkpoint-300/rng_state_5.pth +1 -1
- checkpoint-300/rng_state_6.pth +2 -2
- checkpoint-300/rng_state_7.pth +2 -2
- checkpoint-300/trainer_state.json +0 -0
- checkpoint-300/training_args.bin +1 -1
checkpoint-300/adapter_config.json
CHANGED
|
@@ -24,13 +24,13 @@
|
|
| 24 |
"rank_pattern": {},
|
| 25 |
"revision": null,
|
| 26 |
"target_modules": [
|
| 27 |
-
"
|
| 28 |
"up_proj",
|
| 29 |
"gate_proj",
|
| 30 |
"v_proj",
|
| 31 |
-
"
|
| 32 |
-
"
|
| 33 |
-
"
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
| 36 |
"trainable_token_indices": null,
|
|
|
|
| 24 |
"rank_pattern": {},
|
| 25 |
"revision": null,
|
| 26 |
"target_modules": [
|
| 27 |
+
"k_proj",
|
| 28 |
"up_proj",
|
| 29 |
"gate_proj",
|
| 30 |
"v_proj",
|
| 31 |
+
"down_proj",
|
| 32 |
+
"o_proj",
|
| 33 |
+
"q_proj"
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
| 36 |
"trainable_token_indices": null,
|
checkpoint-300/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 335580296
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a81d4fdf0d3d71cad6c4494b85579c3562173e08a8516df716a458db975ee4ba
|
| 3 |
size 335580296
|
checkpoint-300/global_step300/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665797
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bb27a1f5a7881736fedbf6dab589af4b59a6f7233924afe27699f681200aa854
|
| 3 |
size 251665797
|
checkpoint-300/global_step300/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665797
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d9fa93e661547109c1e6236c1bce2d0121c254badc78b59a972aa0da951caed
|
| 3 |
size 251665797
|
checkpoint-300/global_step300/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665797
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:801bb9df2223195ef800afd7356c72be7d3386b2f45e9e3ca1f26c5578c130d1
|
| 3 |
size 251665797
|
checkpoint-300/global_step300/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665861
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:973e911c4d50dff1b06947221ca6faf96bacb18293ac4d0b3a531e4e9064a58b
|
| 3 |
size 251665861
|
checkpoint-300/global_step300/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665861
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e5df61d6505848a9c35dcb31e42438b689e3e7a1b4b0b380999a9b4a46bffdd
|
| 3 |
size 251665861
|
checkpoint-300/global_step300/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665861
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e06ba9d695f8b49fc31dab04db9618bd479cc9f4df9e2dc6334fdf37c49e788d
|
| 3 |
size 251665861
|
checkpoint-300/global_step300/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665861
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d804d5260b7722cd10285c1c3636deb95c696fd954693e408e6ede0ee4e51931
|
| 3 |
size 251665861
|
checkpoint-300/global_step300/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665861
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2d80013b0aada9ff159e6bae695e0ff41260c89996489a4be203d22cf2de0a0d
|
| 3 |
size 251665861
|
checkpoint-300/global_step300/mp_rank_00_model_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 447220134
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:461a3122d236e5b58a9e72a64bf1947c13d71ec366ff0d0fa155d2308ffd6242
|
| 3 |
size 447220134
|
checkpoint-300/rng_state_0.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09796da0d7a97c43d5b954b86517caec30cbfcc3b5bb61a2803af5c7633d0413
|
| 3 |
+
size 16453
|
checkpoint-300/rng_state_1.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f21c1e066922df0063a60933ed161962048eeb45b8af04b8eac26055bdf564cb
|
| 3 |
+
size 16389
|
checkpoint-300/rng_state_2.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 16389
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8bcd44d37ba4e3697215e15340177f9cb971b5335aa823fae2f6c616a7f8b1c
|
| 3 |
size 16389
|
checkpoint-300/rng_state_3.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 16325
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb6a2c1f892fa7778cb9a11d3287ed89e333ebd37430209d6efffc74c0d6cff6
|
| 3 |
size 16325
|
checkpoint-300/rng_state_4.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:96d53aba74b24e3ecdeb9fd542ce73e3b501032da6a744466f6414fa59c06594
|
| 3 |
+
size 16389
|
checkpoint-300/rng_state_5.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 16389
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:753c07da620c81071c41066c8953c5a03b003e4ed3a107966681bbc925d93d70
|
| 3 |
size 16389
|
checkpoint-300/rng_state_6.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:531f76d581428ac56a6898cc170cc28a819930c9fbd0fc5b5e8c254e04a7c9a4
|
| 3 |
+
size 16389
|
checkpoint-300/rng_state_7.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b4961b297199a42b21419f55e0a6922fe51451bbb9156f3fa3410f56bdd1c7c7
|
| 3 |
+
size 16389
|
checkpoint-300/trainer_state.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
checkpoint-300/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 10129
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b2b580dfdced6e43d90902d33846dd582730283be348589cde9c58ad3764659
|
| 3 |
size 10129
|