Training in progress, epoch 7, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step1352/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step1352/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step1352/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step1352/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step1352/mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +169 -3
last-checkpoint/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 555780720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86839f7e37cf9db50d92aa3359c8a951b16bcb9bd19179d97785c9380e60d4de
|
| 3 |
size 555780720
|
last-checkpoint/global_step1352/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa5f32f83b8dd1abdff17aa4d8a62cf2df4d05afc1f775aa2f6b93598139e4b4
|
| 3 |
+
size 418993765
|
last-checkpoint/global_step1352/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5fc2fc0cd5ce123568d266b89c4f539a173812273213ba02d058dfdf7b623daf
|
| 3 |
+
size 418993829
|
last-checkpoint/global_step1352/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dd31753cbe0128c999d089e0b6ae68cd9dc9534e5009bc8833ba113b6cfc75e4
|
| 3 |
+
size 418993829
|
last-checkpoint/global_step1352/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a79f62be1ee42d6d4cdaa1d1ae0c25bb27a3f27a7ee18554197caf2fc8ddc5d
|
| 3 |
+
size 418993829
|
last-checkpoint/global_step1352/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2c178a80caac549930759dd5ddeae56a0eebd44125e85347a79d3546d5ea720a
|
| 3 |
+
size 555959385
|
last-checkpoint/latest
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
|
|
|
|
| 1 |
+
global_step1352
|
last-checkpoint/rng_state_0.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95a3c87bc88363e3f4b77947b12ea79773944af0114a1b604be41b603f0e088e
|
| 3 |
size 15429
|
last-checkpoint/rng_state_1.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:339163084457ee5fe928af6d9e73b4f74db7625bc6e88a289af439ef57976bfb
|
| 3 |
size 15429
|
last-checkpoint/rng_state_2.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d12472ec366ee397869b0f92eb4add458e30b5e37a8a371422c324e97a75e38b
|
| 3 |
size 15429
|
last-checkpoint/rng_state_3.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e20f7fa0cdcee712ddbb996fd4afd5bdb4a4fcb884815462037415fce9b45978
|
| 3 |
size 15429
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06ca58d1a0dee9bbca88545d604f59334241351618fe2f019276217fe27d5f25
|
| 3 |
size 1401
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,10 +1,10 @@
|
|
| 1 |
{
|
| 2 |
"best_global_step": null,
|
| 3 |
-
"best_metric": 0.
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 7.
|
| 6 |
"eval_steps": 50,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -4324,6 +4324,172 @@
|
|
| 4324 |
"eval_samples_per_second": 44.586,
|
| 4325 |
"eval_steps_per_second": 2.834,
|
| 4326 |
"step": 1300
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4327 |
}
|
| 4328 |
],
|
| 4329 |
"logging_steps": 5,
|
|
|
|
| 1 |
{
|
| 2 |
"best_global_step": null,
|
| 3 |
+
"best_metric": 0.13855531811714172,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 7.3358158429248475,
|
| 6 |
"eval_steps": 50,
|
| 7 |
+
"global_step": 1350,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 4324 |
"eval_samples_per_second": 44.586,
|
| 4325 |
"eval_steps_per_second": 2.834,
|
| 4326 |
"step": 1300
|
| 4327 |
+
},
|
| 4328 |
+
{
|
| 4329 |
+
"epoch": 7.0920785375761675,
|
| 4330 |
+
"grad_norm": 0.9328561425209045,
|
| 4331 |
+
"learning_rate": 1.2436575721991239e-05,
|
| 4332 |
+
"logits/chosen": -0.8173828125,
|
| 4333 |
+
"logits/rejected": NaN,
|
| 4334 |
+
"logps/chosen": -368.45001220703125,
|
| 4335 |
+
"logps/rejected": -367.8500061035156,
|
| 4336 |
+
"loss": 0.1569,
|
| 4337 |
+
"rewards/accuracies": 0.9453125,
|
| 4338 |
+
"rewards/chosen": -7.185156345367432,
|
| 4339 |
+
"rewards/margins": 3.2300782203674316,
|
| 4340 |
+
"rewards/rejected": -10.420312881469727,
|
| 4341 |
+
"step": 1305
|
| 4342 |
+
},
|
| 4343 |
+
{
|
| 4344 |
+
"epoch": 7.1191604603926875,
|
| 4345 |
+
"grad_norm": 1.522709608078003,
|
| 4346 |
+
"learning_rate": 1.2432752041311519e-05,
|
| 4347 |
+
"logits/chosen": -0.8003906011581421,
|
| 4348 |
+
"logits/rejected": -0.82373046875,
|
| 4349 |
+
"logps/chosen": -369.20001220703125,
|
| 4350 |
+
"logps/rejected": -381.8999938964844,
|
| 4351 |
+
"loss": 0.1374,
|
| 4352 |
+
"rewards/accuracies": 0.9468749761581421,
|
| 4353 |
+
"rewards/chosen": -6.989062309265137,
|
| 4354 |
+
"rewards/margins": 3.359375,
|
| 4355 |
+
"rewards/rejected": -10.346875190734863,
|
| 4356 |
+
"step": 1310
|
| 4357 |
+
},
|
| 4358 |
+
{
|
| 4359 |
+
"epoch": 7.1462423832092075,
|
| 4360 |
+
"grad_norm": 1.6700057983398438,
|
| 4361 |
+
"learning_rate": 1.2428913301215597e-05,
|
| 4362 |
+
"logits/chosen": NaN,
|
| 4363 |
+
"logits/rejected": -0.8626953363418579,
|
| 4364 |
+
"logps/chosen": -356.04998779296875,
|
| 4365 |
+
"logps/rejected": -373.29998779296875,
|
| 4366 |
+
"loss": 0.1575,
|
| 4367 |
+
"rewards/accuracies": 0.934374988079071,
|
| 4368 |
+
"rewards/chosen": -6.440625190734863,
|
| 4369 |
+
"rewards/margins": 3.438671827316284,
|
| 4370 |
+
"rewards/rejected": -9.872655868530273,
|
| 4371 |
+
"step": 1315
|
| 4372 |
+
},
|
| 4373 |
+
{
|
| 4374 |
+
"epoch": 7.1733243060257275,
|
| 4375 |
+
"grad_norm": 1.6624808311462402,
|
| 4376 |
+
"learning_rate": 1.2425059511367494e-05,
|
| 4377 |
+
"logits/chosen": -0.8272460699081421,
|
| 4378 |
+
"logits/rejected": -0.835644543170929,
|
| 4379 |
+
"logps/chosen": -361.6000061035156,
|
| 4380 |
+
"logps/rejected": -364.6000061035156,
|
| 4381 |
+
"loss": 0.1679,
|
| 4382 |
+
"rewards/accuracies": 0.940625011920929,
|
| 4383 |
+
"rewards/chosen": -6.254687309265137,
|
| 4384 |
+
"rewards/margins": 3.313281297683716,
|
| 4385 |
+
"rewards/rejected": -9.573437690734863,
|
| 4386 |
+
"step": 1320
|
| 4387 |
+
},
|
| 4388 |
+
{
|
| 4389 |
+
"epoch": 7.2004062288422475,
|
| 4390 |
+
"grad_norm": 2.2478160858154297,
|
| 4391 |
+
"learning_rate": 1.2421190681469124e-05,
|
| 4392 |
+
"logits/chosen": -0.782519519329071,
|
| 4393 |
+
"logits/rejected": NaN,
|
| 4394 |
+
"logps/chosen": -355.54998779296875,
|
| 4395 |
+
"logps/rejected": -364.625,
|
| 4396 |
+
"loss": 0.1743,
|
| 4397 |
+
"rewards/accuracies": 0.9437500238418579,
|
| 4398 |
+
"rewards/chosen": -6.853125095367432,
|
| 4399 |
+
"rewards/margins": 2.9222655296325684,
|
| 4400 |
+
"rewards/rejected": -9.770312309265137,
|
| 4401 |
+
"step": 1325
|
| 4402 |
+
},
|
| 4403 |
+
{
|
| 4404 |
+
"epoch": 7.2274881516587675,
|
| 4405 |
+
"grad_norm": 1.1094180345535278,
|
| 4406 |
+
"learning_rate": 1.241730682126026e-05,
|
| 4407 |
+
"logits/chosen": NaN,
|
| 4408 |
+
"logits/rejected": -0.796191394329071,
|
| 4409 |
+
"logps/chosen": -369.8500061035156,
|
| 4410 |
+
"logps/rejected": -372.1000061035156,
|
| 4411 |
+
"loss": 0.1671,
|
| 4412 |
+
"rewards/accuracies": 0.953125,
|
| 4413 |
+
"rewards/chosen": -7.446875095367432,
|
| 4414 |
+
"rewards/margins": 2.931640625,
|
| 4415 |
+
"rewards/rejected": -10.378125190734863,
|
| 4416 |
+
"step": 1330
|
| 4417 |
+
},
|
| 4418 |
+
{
|
| 4419 |
+
"epoch": 7.2545700744752875,
|
| 4420 |
+
"grad_norm": 1.275765299797058,
|
| 4421 |
+
"learning_rate": 1.2413407940518518e-05,
|
| 4422 |
+
"logits/chosen": -0.8089843988418579,
|
| 4423 |
+
"logits/rejected": -0.8099609613418579,
|
| 4424 |
+
"logps/chosen": -370.5,
|
| 4425 |
+
"logps/rejected": -388.04998779296875,
|
| 4426 |
+
"loss": 0.1589,
|
| 4427 |
+
"rewards/accuracies": 0.9453125,
|
| 4428 |
+
"rewards/chosen": -7.414843559265137,
|
| 4429 |
+
"rewards/margins": 3.5,
|
| 4430 |
+
"rewards/rejected": -10.917187690734863,
|
| 4431 |
+
"step": 1335
|
| 4432 |
+
},
|
| 4433 |
+
{
|
| 4434 |
+
"epoch": 7.2816519972918075,
|
| 4435 |
+
"grad_norm": 1.6279685497283936,
|
| 4436 |
+
"learning_rate": 1.2409494049059322e-05,
|
| 4437 |
+
"logits/chosen": NaN,
|
| 4438 |
+
"logits/rejected": -0.7696288824081421,
|
| 4439 |
+
"logps/chosen": -366.95001220703125,
|
| 4440 |
+
"logps/rejected": -403.3500061035156,
|
| 4441 |
+
"loss": 0.1804,
|
| 4442 |
+
"rewards/accuracies": 0.9296875,
|
| 4443 |
+
"rewards/chosen": -7.529687404632568,
|
| 4444 |
+
"rewards/margins": 3.614453077316284,
|
| 4445 |
+
"rewards/rejected": -11.146875381469727,
|
| 4446 |
+
"step": 1340
|
| 4447 |
+
},
|
| 4448 |
+
{
|
| 4449 |
+
"epoch": 7.3087339201083275,
|
| 4450 |
+
"grad_norm": 1.6767570972442627,
|
| 4451 |
+
"learning_rate": 1.2405565156735891e-05,
|
| 4452 |
+
"logits/chosen": -0.6883789300918579,
|
| 4453 |
+
"logits/rejected": -0.69970703125,
|
| 4454 |
+
"logps/chosen": -386.6499938964844,
|
| 4455 |
+
"logps/rejected": -387.95001220703125,
|
| 4456 |
+
"loss": 0.1821,
|
| 4457 |
+
"rewards/accuracies": 0.925000011920929,
|
| 4458 |
+
"rewards/chosen": -7.953906059265137,
|
| 4459 |
+
"rewards/margins": 3.3148436546325684,
|
| 4460 |
+
"rewards/rejected": -11.268750190734863,
|
| 4461 |
+
"step": 1345
|
| 4462 |
+
},
|
| 4463 |
+
{
|
| 4464 |
+
"epoch": 7.3358158429248475,
|
| 4465 |
+
"grad_norm": 1.182672142982483,
|
| 4466 |
+
"learning_rate": 1.2401621273439206e-05,
|
| 4467 |
+
"logits/chosen": -0.683789074420929,
|
| 4468 |
+
"logits/rejected": -0.6509765386581421,
|
| 4469 |
+
"logps/chosen": -375.29998779296875,
|
| 4470 |
+
"logps/rejected": -388.8999938964844,
|
| 4471 |
+
"loss": 0.1432,
|
| 4472 |
+
"rewards/accuracies": 0.949999988079071,
|
| 4473 |
+
"rewards/chosen": -7.917187690734863,
|
| 4474 |
+
"rewards/margins": 3.202343702316284,
|
| 4475 |
+
"rewards/rejected": -11.123437881469727,
|
| 4476 |
+
"step": 1350
|
| 4477 |
+
},
|
| 4478 |
+
{
|
| 4479 |
+
"epoch": 7.3358158429248475,
|
| 4480 |
+
"eval_logits/chosen": -0.6861979365348816,
|
| 4481 |
+
"eval_logits/rejected": NaN,
|
| 4482 |
+
"eval_logps/chosen": -375.1111145019531,
|
| 4483 |
+
"eval_logps/rejected": -389.20001220703125,
|
| 4484 |
+
"eval_loss": 0.13855531811714172,
|
| 4485 |
+
"eval_rewards/accuracies": 0.9513888955116272,
|
| 4486 |
+
"eval_rewards/chosen": -7.346527576446533,
|
| 4487 |
+
"eval_rewards/margins": 3.3333332538604736,
|
| 4488 |
+
"eval_rewards/rejected": -10.679166793823242,
|
| 4489 |
+
"eval_runtime": 15.8625,
|
| 4490 |
+
"eval_samples_per_second": 44.634,
|
| 4491 |
+
"eval_steps_per_second": 2.837,
|
| 4492 |
+
"step": 1350
|
| 4493 |
}
|
| 4494 |
],
|
| 4495 |
"logging_steps": 5,
|