Training in progress, step 2300, checkpoint
Browse files- checkpoint-2300/adapter_config.json +4 -4
- checkpoint-2300/adapter_model.safetensors +1 -1
- checkpoint-2300/global_step2300/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +1 -1
- checkpoint-2300/global_step2300/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +1 -1
- checkpoint-2300/global_step2300/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +1 -1
- checkpoint-2300/global_step2300/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +1 -1
- checkpoint-2300/global_step2300/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +1 -1
- checkpoint-2300/global_step2300/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +1 -1
- checkpoint-2300/global_step2300/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +1 -1
- checkpoint-2300/global_step2300/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +1 -1
- checkpoint-2300/global_step2300/mp_rank_00_model_states.pt +1 -1
- checkpoint-2300/rng_state_0.pth +1 -1
- checkpoint-2300/rng_state_1.pth +1 -1
- checkpoint-2300/rng_state_2.pth +2 -2
- checkpoint-2300/rng_state_3.pth +1 -1
- checkpoint-2300/rng_state_4.pth +2 -2
- checkpoint-2300/rng_state_5.pth +2 -2
- checkpoint-2300/rng_state_6.pth +1 -1
- checkpoint-2300/rng_state_7.pth +2 -2
- checkpoint-2300/trainer_state.json +0 -0
- checkpoint-2300/training_args.bin +1 -1
checkpoint-2300/adapter_config.json
CHANGED
|
@@ -24,13 +24,13 @@
|
|
| 24 |
"rank_pattern": {},
|
| 25 |
"revision": null,
|
| 26 |
"target_modules": [
|
| 27 |
-
"
|
| 28 |
"up_proj",
|
| 29 |
"gate_proj",
|
| 30 |
"v_proj",
|
| 31 |
-
"
|
| 32 |
-
"
|
| 33 |
-
"
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
| 36 |
"trainable_token_indices": null,
|
|
|
|
| 24 |
"rank_pattern": {},
|
| 25 |
"revision": null,
|
| 26 |
"target_modules": [
|
| 27 |
+
"k_proj",
|
| 28 |
"up_proj",
|
| 29 |
"gate_proj",
|
| 30 |
"v_proj",
|
| 31 |
+
"down_proj",
|
| 32 |
+
"o_proj",
|
| 33 |
+
"q_proj"
|
| 34 |
],
|
| 35 |
"task_type": "CAUSAL_LM",
|
| 36 |
"trainable_token_indices": null,
|
checkpoint-2300/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 335580296
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc227a0d18135e7ca3db824172f1e7470eb6ce135ace64dae49fd68986093833
|
| 3 |
size 335580296
|
checkpoint-2300/global_step2300/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665797
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f538f011f4477c9a37480357d5605367324f95e4fe60f6c73aa049a68b83678
|
| 3 |
size 251665797
|
checkpoint-2300/global_step2300/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665797
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9abf8e6a7f5f2e14e8c13f5c8f760e4ca1cd01f2b94bf3463af91a934d110d34
|
| 3 |
size 251665797
|
checkpoint-2300/global_step2300/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665797
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41fb4505aedbede6809d094f35af8ffc630141f389fd750aaec8786d34399163
|
| 3 |
size 251665797
|
checkpoint-2300/global_step2300/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665861
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3c24ebc15c6c34e63355fed7d9a3272e5e97403a680c1f2d2633e2e6d27aafc5
|
| 3 |
size 251665861
|
checkpoint-2300/global_step2300/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665861
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4a70340fcbd47feaad71b8ef217ac4a12210256bc571fbb5754b4fe1c443504
|
| 3 |
size 251665861
|
checkpoint-2300/global_step2300/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665861
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:290bd9be59be2daade4e2e6332d209905d89de2569f3f79d12c8b6f97e33aa13
|
| 3 |
size 251665861
|
checkpoint-2300/global_step2300/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665861
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:21403da810cfaf5ab971a16d03727deb13ea8950c1e246f260f13dac44e5b1b3
|
| 3 |
size 251665861
|
checkpoint-2300/global_step2300/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 251665861
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0fb4e0fe6617492537bbbf4df03f9f8d6a6560c93de436e152a925f00e3e4ae3
|
| 3 |
size 251665861
|
checkpoint-2300/global_step2300/mp_rank_00_model_states.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 447220134
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:57ae6e121b6ad0a4ca3567359de04fe151fba08e93cb23139ab87da8652c92ad
|
| 3 |
size 447220134
|
checkpoint-2300/rng_state_0.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 16389
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:43047b40d8c52eabe7d48e1ba69ff8832ffcca8f58f0af738fba7e6544c08526
|
| 3 |
size 16389
|
checkpoint-2300/rng_state_1.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 16325
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3cfa1472e2672b6d519fa8e55fa57770361ef1858b7375c46d09182fafe94d8b
|
| 3 |
size 16325
|
checkpoint-2300/rng_state_2.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:67d7cf3abe89756f5567971af6f5fa58a745ee5192cf2d4f0a69547f851e9da6
|
| 3 |
+
size 16389
|
checkpoint-2300/rng_state_3.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 16453
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:44eae2ebd5a72a844ba58cc3e96f2758b3cad9bcee49332720ec7d630b415096
|
| 3 |
size 16453
|
checkpoint-2300/rng_state_4.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac88818d7bfbd09e0f9158debc9ca0fc0b3f847bb4e9e51c28ce69b7ef5dd055
|
| 3 |
+
size 16453
|
checkpoint-2300/rng_state_5.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:05fa6094427925a6af04ceaf32c36aba1b0918d40dfdde8fbac7e13ee74cce04
|
| 3 |
+
size 16389
|
checkpoint-2300/rng_state_6.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 16389
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef7c0ad4c96ce98362e36157f48860a9e456e323fde53a888717a5e39df7a051
|
| 3 |
size 16389
|
checkpoint-2300/rng_state_7.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:924419e317273397b7e71ceaec67a18a08720b754983eaca11cfd6686b2cba19
|
| 3 |
+
size 16453
|
checkpoint-2300/trainer_state.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
checkpoint-2300/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 10129
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b2b580dfdced6e43d90902d33846dd582730283be348589cde9c58ad3764659
|
| 3 |
size 10129
|