Model save
Browse files- best/global_step150/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- best/global_step150/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- best/global_step150/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- best/global_step150/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- best/global_step150/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- best/global_step150/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- best/global_step150/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- best/global_step150/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- best/global_step150/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- best/global_step150/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- best/global_step150/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- best/global_step150/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- best/global_step150/zero_pp_rank_4_mp_rank_00_model_states.pt +3 -0
- best/global_step150/zero_pp_rank_5_mp_rank_00_model_states.pt +3 -0
- best/global_step150/zero_pp_rank_6_mp_rank_00_model_states.pt +3 -0
- best/global_step150/zero_pp_rank_7_mp_rank_00_model_states.pt +3 -0
- best/latest +1 -1
- best/monitor.json +5 -5
- global_step150/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- global_step150/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- global_step150/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- global_step150/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- global_step150/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- global_step150/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- global_step150/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- global_step150/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- global_step150/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- global_step150/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- global_step150/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- global_step150/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- global_step150/zero_pp_rank_4_mp_rank_00_model_states.pt +3 -0
- global_step150/zero_pp_rank_5_mp_rank_00_model_states.pt +3 -0
- global_step150/zero_pp_rank_6_mp_rank_00_model_states.pt +3 -0
- global_step150/zero_pp_rank_7_mp_rank_00_model_states.pt +3 -0
- latest +1 -1
- logs/events.out.tfevents.1754432204.1506d310068f.1511638.0 +2 -2
best/global_step150/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b45eb93de468bc2e16661b2f1986065488d3dca32246535fcf7748e2b82c8b4f
|
| 3 |
+
size 12286638307
|
best/global_step150/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fab3742efd05e45a75c35f06b93ae8835d9f79b54ee3f06586afe12c7cedd787
|
| 3 |
+
size 12286638307
|
best/global_step150/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b69d0cc87bb338243f011f797bf92cc89e02c4727e59eb23c0aaf9c0a9e3a38
|
| 3 |
+
size 12286638307
|
best/global_step150/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6df1e6cefc1b991f0e752acb2f33e9f4b77d705dfd7b594cea12c766b233a472
|
| 3 |
+
size 12286638307
|
best/global_step150/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dce9e97c4584ada3dfdc0f4970471af77b8f2a5bd43ceb77fa2fdda2f3686eb7
|
| 3 |
+
size 12286638307
|
best/global_step150/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88be19313236d15b7ca105005ccd42f3572278fb0ef0803fa1d0949e1af41435
|
| 3 |
+
size 12286638307
|
best/global_step150/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b8e4d1692b35b2db6fd26284266875acfb78df893b56fdd0b7c5a4f857f08e7
|
| 3 |
+
size 12286638307
|
best/global_step150/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da535fe23b4b7b5c851b47ced81d1806ee798fccf84ab6985acfa70473006389
|
| 3 |
+
size 12286638307
|
best/global_step150/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f7758d880d96838c48768f98dbfa3b6e440dd6654c802a4793323c4df78c127
|
| 3 |
+
size 206444
|
best/global_step150/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8a3728183612ed728c80b8219d0e1d9a587023d8f64f5cac3a3b1fbfba7db92
|
| 3 |
+
size 206444
|
best/global_step150/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab599a1a1daa2152e8008888b9fba22a9f21b0f9878ad19e794ffc4f07a3ab45
|
| 3 |
+
size 206444
|
best/global_step150/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:622f0c2b4b7d373a0f918bad376c958d5e2d4474110aafad87efd75086a2e9f3
|
| 3 |
+
size 206444
|
best/global_step150/zero_pp_rank_4_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e36509707d4576df45892a03617962ee521e31a5407b91a64cba810e1448efe
|
| 3 |
+
size 206444
|
best/global_step150/zero_pp_rank_5_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dfd6cdce3eae912dce3c3267f34da45bf4c0b3eb67e09f8ff26c0ea61f9b625f
|
| 3 |
+
size 206444
|
best/global_step150/zero_pp_rank_6_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a4b4b4a34bd0b0d9f940958a6de16839b5becf74b6337fbf435262151285449
|
| 3 |
+
size 206444
|
best/global_step150/zero_pp_rank_7_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ff35bace19748fb1f00f1fed6a9440f7d37e7a65f4925aae7b285e76234e0f7
|
| 3 |
+
size 206444
|
best/latest
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
|
|
|
|
| 1 |
+
global_step150
|
best/monitor.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
-
"global_step":
|
| 3 |
-
"test1_loss": 0.
|
| 4 |
-
"test2_loss": 0.
|
| 5 |
-
"test3_loss": 0.
|
| 6 |
-
"combined_test_loss": 0.
|
| 7 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"global_step": 150,
|
| 3 |
+
"test1_loss": 0.5349587609413929,
|
| 4 |
+
"test2_loss": 0.6594466084215839,
|
| 5 |
+
"test3_loss": 0.4015509325333617,
|
| 6 |
+
"combined_test_loss": 0.6594466084215839
|
| 7 |
}
|
global_step150/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b45eb93de468bc2e16661b2f1986065488d3dca32246535fcf7748e2b82c8b4f
|
| 3 |
+
size 12286638307
|
global_step150/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fab3742efd05e45a75c35f06b93ae8835d9f79b54ee3f06586afe12c7cedd787
|
| 3 |
+
size 12286638307
|
global_step150/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b69d0cc87bb338243f011f797bf92cc89e02c4727e59eb23c0aaf9c0a9e3a38
|
| 3 |
+
size 12286638307
|
global_step150/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6df1e6cefc1b991f0e752acb2f33e9f4b77d705dfd7b594cea12c766b233a472
|
| 3 |
+
size 12286638307
|
global_step150/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dce9e97c4584ada3dfdc0f4970471af77b8f2a5bd43ceb77fa2fdda2f3686eb7
|
| 3 |
+
size 12286638307
|
global_step150/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88be19313236d15b7ca105005ccd42f3572278fb0ef0803fa1d0949e1af41435
|
| 3 |
+
size 12286638307
|
global_step150/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b8e4d1692b35b2db6fd26284266875acfb78df893b56fdd0b7c5a4f857f08e7
|
| 3 |
+
size 12286638307
|
global_step150/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da535fe23b4b7b5c851b47ced81d1806ee798fccf84ab6985acfa70473006389
|
| 3 |
+
size 12286638307
|
global_step150/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f7758d880d96838c48768f98dbfa3b6e440dd6654c802a4793323c4df78c127
|
| 3 |
+
size 206444
|
global_step150/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8a3728183612ed728c80b8219d0e1d9a587023d8f64f5cac3a3b1fbfba7db92
|
| 3 |
+
size 206444
|
global_step150/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab599a1a1daa2152e8008888b9fba22a9f21b0f9878ad19e794ffc4f07a3ab45
|
| 3 |
+
size 206444
|
global_step150/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:622f0c2b4b7d373a0f918bad376c958d5e2d4474110aafad87efd75086a2e9f3
|
| 3 |
+
size 206444
|
global_step150/zero_pp_rank_4_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e36509707d4576df45892a03617962ee521e31a5407b91a64cba810e1448efe
|
| 3 |
+
size 206444
|
global_step150/zero_pp_rank_5_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dfd6cdce3eae912dce3c3267f34da45bf4c0b3eb67e09f8ff26c0ea61f9b625f
|
| 3 |
+
size 206444
|
global_step150/zero_pp_rank_6_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a4b4b4a34bd0b0d9f940958a6de16839b5becf74b6337fbf435262151285449
|
| 3 |
+
size 206444
|
global_step150/zero_pp_rank_7_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ff35bace19748fb1f00f1fed6a9440f7d37e7a65f4925aae7b285e76234e0f7
|
| 3 |
+
size 206444
|
latest
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
|
|
|
|
| 1 |
+
global_step150
|
logs/events.out.tfevents.1754432204.1506d310068f.1511638.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6ccc6c583aaaced879971fe03cac73290929c32c385bc5bbfcf980865d0b3354
|
| 3 |
+
size 57175
|