Training in progress, epoch 0, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step750/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step750/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step750/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step750/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step750/mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +169 -3
last-checkpoint/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1172343536
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4f419d2d3dc57b9b2d5c6ee5508bee95ca09509bd414a8b7fa7c7718b5aa160
|
| 3 |
size 1172343536
|
last-checkpoint/global_step750/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3d177e315e852cf4627e36ccb15bcf1302de2d429e142f1fb08e8d95b7222b7
|
| 3 |
+
size 883824229
|
last-checkpoint/global_step750/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f67988ef568a7b0c3e041d4b7e055fb02fdaadfe44f317ce11b49cfd58c35e45
|
| 3 |
+
size 883824293
|
last-checkpoint/global_step750/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b24df66b44e762e5e340a1d75b1b7e8fc23eec1e224a3e277a6f1289324fb8a9
|
| 3 |
+
size 883824293
|
last-checkpoint/global_step750/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:386c808328d5a03447186a75b5384d45e32af06d9db22785835f980d07184230
|
| 3 |
+
size 883824293
|
last-checkpoint/global_step750/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:423e021a58e384c391c6356f223e5662047217391843f6005d78f92fd65a5a5e
|
| 3 |
+
size 1172522073
|
last-checkpoint/latest
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
|
|
|
|
| 1 |
+
global_step750
|
last-checkpoint/rng_state_0.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8de88920dd9878e568a9d7575b3f30ad8fdfb7e3eb727df0f444fd44869f433d
|
| 3 |
size 15429
|
last-checkpoint/rng_state_1.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e5ad1aac8326d87db53ac90a0364b235b873c9915753b0b1e35cc6c162d6df2
|
| 3 |
size 15429
|
last-checkpoint/rng_state_2.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30aeac380cd7c431ed27d5b99b2dc98aee263183c538104d162fc5f56ac80ce0
|
| 3 |
size 15429
|
last-checkpoint/rng_state_3.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19982de75038fe4dec09b91b36d57d5f858fa950160c70e61093a4adb556ba83
|
| 3 |
size 15429
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:590163296bdb7eb3469073cd35bc51902c716a216d6f5cdd237060726449c33c
|
| 3 |
size 1401
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,10 +1,10 @@
|
|
| 1 |
{
|
| 2 |
"best_global_step": null,
|
| 3 |
-
"best_metric": 0.
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 50,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -2332,6 +2332,172 @@
|
|
| 2332 |
"eval_samples_per_second": 45.331,
|
| 2333 |
"eval_steps_per_second": 2.841,
|
| 2334 |
"step": 700
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2335 |
}
|
| 2336 |
],
|
| 2337 |
"logging_steps": 5,
|
|
|
|
| 1 |
{
|
| 2 |
"best_global_step": null,
|
| 3 |
+
"best_metric": 0.021692628040909767,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.6514657980456026,
|
| 6 |
"eval_steps": 50,
|
| 7 |
+
"global_step": 750,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 2332 |
"eval_samples_per_second": 45.331,
|
| 2333 |
"eval_steps_per_second": 2.841,
|
| 2334 |
"step": 700
|
| 2335 |
+
},
|
| 2336 |
+
{
|
| 2337 |
+
"epoch": 0.6123778501628665,
|
| 2338 |
+
"grad_norm": 0.4941781461238861,
|
| 2339 |
+
"learning_rate": 2.5752849078774175e-05,
|
| 2340 |
+
"logits/chosen": -1.190332055091858,
|
| 2341 |
+
"logits/rejected": -1.6921875476837158,
|
| 2342 |
+
"logps/chosen": -99.82499694824219,
|
| 2343 |
+
"logps/rejected": -199.77499389648438,
|
| 2344 |
+
"loss": 0.0231,
|
| 2345 |
+
"rewards/accuracies": 0.995312511920929,
|
| 2346 |
+
"rewards/chosen": -2.4974608421325684,
|
| 2347 |
+
"rewards/margins": 13.4296875,
|
| 2348 |
+
"rewards/rejected": -15.926562309265137,
|
| 2349 |
+
"step": 705
|
| 2350 |
+
},
|
| 2351 |
+
{
|
| 2352 |
+
"epoch": 0.6167209554831705,
|
| 2353 |
+
"grad_norm": 0.8641561269760132,
|
| 2354 |
+
"learning_rate": 2.5748905089671384e-05,
|
| 2355 |
+
"logits/chosen": -1.181249976158142,
|
| 2356 |
+
"logits/rejected": -1.7000000476837158,
|
| 2357 |
+
"logps/chosen": -98.61250305175781,
|
| 2358 |
+
"logps/rejected": -195.6750030517578,
|
| 2359 |
+
"loss": 0.0268,
|
| 2360 |
+
"rewards/accuracies": 0.989062488079071,
|
| 2361 |
+
"rewards/chosen": -2.160937547683716,
|
| 2362 |
+
"rewards/margins": 13.271875381469727,
|
| 2363 |
+
"rewards/rejected": -15.4375,
|
| 2364 |
+
"step": 710
|
| 2365 |
+
},
|
| 2366 |
+
{
|
| 2367 |
+
"epoch": 0.6210640608034745,
|
| 2368 |
+
"grad_norm": 1.3184161186218262,
|
| 2369 |
+
"learning_rate": 2.574492899366642e-05,
|
| 2370 |
+
"logits/chosen": -1.0817382335662842,
|
| 2371 |
+
"logits/rejected": -1.6388671398162842,
|
| 2372 |
+
"logps/chosen": -96.3125,
|
| 2373 |
+
"logps/rejected": -200.47500610351562,
|
| 2374 |
+
"loss": 0.0193,
|
| 2375 |
+
"rewards/accuracies": 0.9921875,
|
| 2376 |
+
"rewards/chosen": -1.3796875476837158,
|
| 2377 |
+
"rewards/margins": 14.248437881469727,
|
| 2378 |
+
"rewards/rejected": -15.629687309265137,
|
| 2379 |
+
"step": 715
|
| 2380 |
+
},
|
| 2381 |
+
{
|
| 2382 |
+
"epoch": 0.6254071661237784,
|
| 2383 |
+
"grad_norm": 0.4678487479686737,
|
| 2384 |
+
"learning_rate": 2.5740920800769096e-05,
|
| 2385 |
+
"logits/chosen": -1.0939452648162842,
|
| 2386 |
+
"logits/rejected": -1.6455078125,
|
| 2387 |
+
"logps/chosen": -95.30000305175781,
|
| 2388 |
+
"logps/rejected": -211.9499969482422,
|
| 2389 |
+
"loss": 0.0156,
|
| 2390 |
+
"rewards/accuracies": 0.9937499761581421,
|
| 2391 |
+
"rewards/chosen": -1.7891356945037842,
|
| 2392 |
+
"rewards/margins": 16.373437881469727,
|
| 2393 |
+
"rewards/rejected": -18.157812118530273,
|
| 2394 |
+
"step": 720
|
| 2395 |
+
},
|
| 2396 |
+
{
|
| 2397 |
+
"epoch": 0.6297502714440825,
|
| 2398 |
+
"grad_norm": 0.20339182019233704,
|
| 2399 |
+
"learning_rate": 2.5736880521070034e-05,
|
| 2400 |
+
"logits/chosen": -1.130468726158142,
|
| 2401 |
+
"logits/rejected": -1.6033203601837158,
|
| 2402 |
+
"logps/chosen": -99.1500015258789,
|
| 2403 |
+
"logps/rejected": -221.72500610351562,
|
| 2404 |
+
"loss": 0.0196,
|
| 2405 |
+
"rewards/accuracies": 0.9937499761581421,
|
| 2406 |
+
"rewards/chosen": -2.719921827316284,
|
| 2407 |
+
"rewards/margins": 17.65625,
|
| 2408 |
+
"rewards/rejected": -20.381250381469727,
|
| 2409 |
+
"step": 725
|
| 2410 |
+
},
|
| 2411 |
+
{
|
| 2412 |
+
"epoch": 0.6340933767643865,
|
| 2413 |
+
"grad_norm": 0.7277128100395203,
|
| 2414 |
+
"learning_rate": 2.5732808164740634e-05,
|
| 2415 |
+
"logits/chosen": -1.0881836414337158,
|
| 2416 |
+
"logits/rejected": -1.5712890625,
|
| 2417 |
+
"logps/chosen": -102.1875,
|
| 2418 |
+
"logps/rejected": -225.875,
|
| 2419 |
+
"loss": 0.0202,
|
| 2420 |
+
"rewards/accuracies": 0.996874988079071,
|
| 2421 |
+
"rewards/chosen": -2.8536133766174316,
|
| 2422 |
+
"rewards/margins": 17.546875,
|
| 2423 |
+
"rewards/rejected": -20.390625,
|
| 2424 |
+
"step": 730
|
| 2425 |
+
},
|
| 2426 |
+
{
|
| 2427 |
+
"epoch": 0.6384364820846905,
|
| 2428 |
+
"grad_norm": 2.4315991401672363,
|
| 2429 |
+
"learning_rate": 2.5728703742033047e-05,
|
| 2430 |
+
"logits/chosen": -1.0305664539337158,
|
| 2431 |
+
"logits/rejected": -1.572656273841858,
|
| 2432 |
+
"logps/chosen": -100.61250305175781,
|
| 2433 |
+
"logps/rejected": -218.1750030517578,
|
| 2434 |
+
"loss": 0.0522,
|
| 2435 |
+
"rewards/accuracies": 0.987500011920929,
|
| 2436 |
+
"rewards/chosen": -2.8978514671325684,
|
| 2437 |
+
"rewards/margins": 16.684375762939453,
|
| 2438 |
+
"rewards/rejected": -19.587499618530273,
|
| 2439 |
+
"step": 735
|
| 2440 |
+
},
|
| 2441 |
+
{
|
| 2442 |
+
"epoch": 0.6427795874049945,
|
| 2443 |
+
"grad_norm": 0.8356490135192871,
|
| 2444 |
+
"learning_rate": 2.5724567263280155e-05,
|
| 2445 |
+
"logits/chosen": -1.006445288658142,
|
| 2446 |
+
"logits/rejected": -1.5927734375,
|
| 2447 |
+
"logps/chosen": -101.0,
|
| 2448 |
+
"logps/rejected": -210.22500610351562,
|
| 2449 |
+
"loss": 0.0369,
|
| 2450 |
+
"rewards/accuracies": 0.987500011920929,
|
| 2451 |
+
"rewards/chosen": -2.7152342796325684,
|
| 2452 |
+
"rewards/margins": 15.609375,
|
| 2453 |
+
"rewards/rejected": -18.337499618530273,
|
| 2454 |
+
"step": 740
|
| 2455 |
+
},
|
| 2456 |
+
{
|
| 2457 |
+
"epoch": 0.6471226927252985,
|
| 2458 |
+
"grad_norm": 0.9469047784805298,
|
| 2459 |
+
"learning_rate": 2.5720398738895534e-05,
|
| 2460 |
+
"logits/chosen": -0.9302734136581421,
|
| 2461 |
+
"logits/rejected": -1.529296875,
|
| 2462 |
+
"logps/chosen": -98.8375015258789,
|
| 2463 |
+
"logps/rejected": -204.625,
|
| 2464 |
+
"loss": 0.0399,
|
| 2465 |
+
"rewards/accuracies": 0.9921875,
|
| 2466 |
+
"rewards/chosen": -2.419726610183716,
|
| 2467 |
+
"rewards/margins": 14.510937690734863,
|
| 2468 |
+
"rewards/rejected": -16.928125381469727,
|
| 2469 |
+
"step": 745
|
| 2470 |
+
},
|
| 2471 |
+
{
|
| 2472 |
+
"epoch": 0.6514657980456026,
|
| 2473 |
+
"grad_norm": 0.25593864917755127,
|
| 2474 |
+
"learning_rate": 2.571619817937344e-05,
|
| 2475 |
+
"logits/chosen": -0.8580077886581421,
|
| 2476 |
+
"logits/rejected": -1.470703125,
|
| 2477 |
+
"logps/chosen": -101.9625015258789,
|
| 2478 |
+
"logps/rejected": -205.14999389648438,
|
| 2479 |
+
"loss": 0.0313,
|
| 2480 |
+
"rewards/accuracies": 0.9906250238418579,
|
| 2481 |
+
"rewards/chosen": -2.443164110183716,
|
| 2482 |
+
"rewards/margins": 14.162500381469727,
|
| 2483 |
+
"rewards/rejected": -16.6015625,
|
| 2484 |
+
"step": 750
|
| 2485 |
+
},
|
| 2486 |
+
{
|
| 2487 |
+
"epoch": 0.6514657980456026,
|
| 2488 |
+
"eval_logits/chosen": -0.7763848304748535,
|
| 2489 |
+
"eval_logits/rejected": -1.4033167362213135,
|
| 2490 |
+
"eval_logps/chosen": -98.74909973144531,
|
| 2491 |
+
"eval_logps/rejected": -200.59567260742188,
|
| 2492 |
+
"eval_loss": 0.021692628040909767,
|
| 2493 |
+
"eval_rewards/accuracies": 0.9925541281700134,
|
| 2494 |
+
"eval_rewards/chosen": -2.211261749267578,
|
| 2495 |
+
"eval_rewards/margins": 13.938854217529297,
|
| 2496 |
+
"eval_rewards/rejected": -16.1518497467041,
|
| 2497 |
+
"eval_runtime": 97.7492,
|
| 2498 |
+
"eval_samples_per_second": 45.218,
|
| 2499 |
+
"eval_steps_per_second": 2.834,
|
| 2500 |
+
"step": 750
|
| 2501 |
}
|
| 2502 |
],
|
| 2503 |
"logging_steps": 5,
|