FormlessAI commited on
Commit
d8d4bce
·
verified ·
1 Parent(s): 2a87bda

Training in progress, epoch 0, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a25f53b86cb0d18e76005ef7631a16e5d28e2c4b40e63c63c5944927040e7cae
3
  size 1172343536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4f419d2d3dc57b9b2d5c6ee5508bee95ca09509bd414a8b7fa7c7718b5aa160
3
  size 1172343536
last-checkpoint/global_step750/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3d177e315e852cf4627e36ccb15bcf1302de2d429e142f1fb08e8d95b7222b7
3
+ size 883824229
last-checkpoint/global_step750/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f67988ef568a7b0c3e041d4b7e055fb02fdaadfe44f317ce11b49cfd58c35e45
3
+ size 883824293
last-checkpoint/global_step750/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b24df66b44e762e5e340a1d75b1b7e8fc23eec1e224a3e277a6f1289324fb8a9
3
+ size 883824293
last-checkpoint/global_step750/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:386c808328d5a03447186a75b5384d45e32af06d9db22785835f980d07184230
3
+ size 883824293
last-checkpoint/global_step750/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:423e021a58e384c391c6356f223e5662047217391843f6005d78f92fd65a5a5e
3
+ size 1172522073
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step700
 
1
+ global_step750
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f67957e71beac3aac584ce7da49055cc9c7edaf3d732505bfffa5511f709f41
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8de88920dd9878e568a9d7575b3f30ad8fdfb7e3eb727df0f444fd44869f433d
3
  size 15429
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:305594a2a478d20bb06c74dcc62d37dde101425234afb4331ef411c36814de11
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e5ad1aac8326d87db53ac90a0364b235b873c9915753b0b1e35cc6c162d6df2
3
  size 15429
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1eb2d84f63d7341151dcb60706643579b7c3105045d9ce41fc7fd7aa2c6c8fb0
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30aeac380cd7c431ed27d5b99b2dc98aee263183c538104d162fc5f56ac80ce0
3
  size 15429
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5633e0320a424cdde99e10e62d0382c89fdf5b90d88d95ba4955f9644083937
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19982de75038fe4dec09b91b36d57d5f858fa950160c70e61093a4adb556ba83
3
  size 15429
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:336d3de2036e71626b0f815e82e0c2ae29554f5ccd7af556bd21908e68a7f924
3
  size 1401
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:590163296bdb7eb3469073cd35bc51902c716a216d6f5cdd237060726449c33c
3
  size 1401
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
  "best_global_step": null,
3
- "best_metric": 0.028052611276507378,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.6080347448425625,
6
  "eval_steps": 50,
7
- "global_step": 700,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2332,6 +2332,172 @@
2332
  "eval_samples_per_second": 45.331,
2333
  "eval_steps_per_second": 2.841,
2334
  "step": 700
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2335
  }
2336
  ],
2337
  "logging_steps": 5,
 
1
  {
2
  "best_global_step": null,
3
+ "best_metric": 0.021692628040909767,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.6514657980456026,
6
  "eval_steps": 50,
7
+ "global_step": 750,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2332
  "eval_samples_per_second": 45.331,
2333
  "eval_steps_per_second": 2.841,
2334
  "step": 700
2335
+ },
2336
+ {
2337
+ "epoch": 0.6123778501628665,
2338
+ "grad_norm": 0.4941781461238861,
2339
+ "learning_rate": 2.5752849078774175e-05,
2340
+ "logits/chosen": -1.190332055091858,
2341
+ "logits/rejected": -1.6921875476837158,
2342
+ "logps/chosen": -99.82499694824219,
2343
+ "logps/rejected": -199.77499389648438,
2344
+ "loss": 0.0231,
2345
+ "rewards/accuracies": 0.995312511920929,
2346
+ "rewards/chosen": -2.4974608421325684,
2347
+ "rewards/margins": 13.4296875,
2348
+ "rewards/rejected": -15.926562309265137,
2349
+ "step": 705
2350
+ },
2351
+ {
2352
+ "epoch": 0.6167209554831705,
2353
+ "grad_norm": 0.8641561269760132,
2354
+ "learning_rate": 2.5748905089671384e-05,
2355
+ "logits/chosen": -1.181249976158142,
2356
+ "logits/rejected": -1.7000000476837158,
2357
+ "logps/chosen": -98.61250305175781,
2358
+ "logps/rejected": -195.6750030517578,
2359
+ "loss": 0.0268,
2360
+ "rewards/accuracies": 0.989062488079071,
2361
+ "rewards/chosen": -2.160937547683716,
2362
+ "rewards/margins": 13.271875381469727,
2363
+ "rewards/rejected": -15.4375,
2364
+ "step": 710
2365
+ },
2366
+ {
2367
+ "epoch": 0.6210640608034745,
2368
+ "grad_norm": 1.3184161186218262,
2369
+ "learning_rate": 2.574492899366642e-05,
2370
+ "logits/chosen": -1.0817382335662842,
2371
+ "logits/rejected": -1.6388671398162842,
2372
+ "logps/chosen": -96.3125,
2373
+ "logps/rejected": -200.47500610351562,
2374
+ "loss": 0.0193,
2375
+ "rewards/accuracies": 0.9921875,
2376
+ "rewards/chosen": -1.3796875476837158,
2377
+ "rewards/margins": 14.248437881469727,
2378
+ "rewards/rejected": -15.629687309265137,
2379
+ "step": 715
2380
+ },
2381
+ {
2382
+ "epoch": 0.6254071661237784,
2383
+ "grad_norm": 0.4678487479686737,
2384
+ "learning_rate": 2.5740920800769096e-05,
2385
+ "logits/chosen": -1.0939452648162842,
2386
+ "logits/rejected": -1.6455078125,
2387
+ "logps/chosen": -95.30000305175781,
2388
+ "logps/rejected": -211.9499969482422,
2389
+ "loss": 0.0156,
2390
+ "rewards/accuracies": 0.9937499761581421,
2391
+ "rewards/chosen": -1.7891356945037842,
2392
+ "rewards/margins": 16.373437881469727,
2393
+ "rewards/rejected": -18.157812118530273,
2394
+ "step": 720
2395
+ },
2396
+ {
2397
+ "epoch": 0.6297502714440825,
2398
+ "grad_norm": 0.20339182019233704,
2399
+ "learning_rate": 2.5736880521070034e-05,
2400
+ "logits/chosen": -1.130468726158142,
2401
+ "logits/rejected": -1.6033203601837158,
2402
+ "logps/chosen": -99.1500015258789,
2403
+ "logps/rejected": -221.72500610351562,
2404
+ "loss": 0.0196,
2405
+ "rewards/accuracies": 0.9937499761581421,
2406
+ "rewards/chosen": -2.719921827316284,
2407
+ "rewards/margins": 17.65625,
2408
+ "rewards/rejected": -20.381250381469727,
2409
+ "step": 725
2410
+ },
2411
+ {
2412
+ "epoch": 0.6340933767643865,
2413
+ "grad_norm": 0.7277128100395203,
2414
+ "learning_rate": 2.5732808164740634e-05,
2415
+ "logits/chosen": -1.0881836414337158,
2416
+ "logits/rejected": -1.5712890625,
2417
+ "logps/chosen": -102.1875,
2418
+ "logps/rejected": -225.875,
2419
+ "loss": 0.0202,
2420
+ "rewards/accuracies": 0.996874988079071,
2421
+ "rewards/chosen": -2.8536133766174316,
2422
+ "rewards/margins": 17.546875,
2423
+ "rewards/rejected": -20.390625,
2424
+ "step": 730
2425
+ },
2426
+ {
2427
+ "epoch": 0.6384364820846905,
2428
+ "grad_norm": 2.4315991401672363,
2429
+ "learning_rate": 2.5728703742033047e-05,
2430
+ "logits/chosen": -1.0305664539337158,
2431
+ "logits/rejected": -1.572656273841858,
2432
+ "logps/chosen": -100.61250305175781,
2433
+ "logps/rejected": -218.1750030517578,
2434
+ "loss": 0.0522,
2435
+ "rewards/accuracies": 0.987500011920929,
2436
+ "rewards/chosen": -2.8978514671325684,
2437
+ "rewards/margins": 16.684375762939453,
2438
+ "rewards/rejected": -19.587499618530273,
2439
+ "step": 735
2440
+ },
2441
+ {
2442
+ "epoch": 0.6427795874049945,
2443
+ "grad_norm": 0.8356490135192871,
2444
+ "learning_rate": 2.5724567263280155e-05,
2445
+ "logits/chosen": -1.006445288658142,
2446
+ "logits/rejected": -1.5927734375,
2447
+ "logps/chosen": -101.0,
2448
+ "logps/rejected": -210.22500610351562,
2449
+ "loss": 0.0369,
2450
+ "rewards/accuracies": 0.987500011920929,
2451
+ "rewards/chosen": -2.7152342796325684,
2452
+ "rewards/margins": 15.609375,
2453
+ "rewards/rejected": -18.337499618530273,
2454
+ "step": 740
2455
+ },
2456
+ {
2457
+ "epoch": 0.6471226927252985,
2458
+ "grad_norm": 0.9469047784805298,
2459
+ "learning_rate": 2.5720398738895534e-05,
2460
+ "logits/chosen": -0.9302734136581421,
2461
+ "logits/rejected": -1.529296875,
2462
+ "logps/chosen": -98.8375015258789,
2463
+ "logps/rejected": -204.625,
2464
+ "loss": 0.0399,
2465
+ "rewards/accuracies": 0.9921875,
2466
+ "rewards/chosen": -2.419726610183716,
2467
+ "rewards/margins": 14.510937690734863,
2468
+ "rewards/rejected": -16.928125381469727,
2469
+ "step": 745
2470
+ },
2471
+ {
2472
+ "epoch": 0.6514657980456026,
2473
+ "grad_norm": 0.25593864917755127,
2474
+ "learning_rate": 2.571619817937344e-05,
2475
+ "logits/chosen": -0.8580077886581421,
2476
+ "logits/rejected": -1.470703125,
2477
+ "logps/chosen": -101.9625015258789,
2478
+ "logps/rejected": -205.14999389648438,
2479
+ "loss": 0.0313,
2480
+ "rewards/accuracies": 0.9906250238418579,
2481
+ "rewards/chosen": -2.443164110183716,
2482
+ "rewards/margins": 14.162500381469727,
2483
+ "rewards/rejected": -16.6015625,
2484
+ "step": 750
2485
+ },
2486
+ {
2487
+ "epoch": 0.6514657980456026,
2488
+ "eval_logits/chosen": -0.7763848304748535,
2489
+ "eval_logits/rejected": -1.4033167362213135,
2490
+ "eval_logps/chosen": -98.74909973144531,
2491
+ "eval_logps/rejected": -200.59567260742188,
2492
+ "eval_loss": 0.021692628040909767,
2493
+ "eval_rewards/accuracies": 0.9925541281700134,
2494
+ "eval_rewards/chosen": -2.211261749267578,
2495
+ "eval_rewards/margins": 13.938854217529297,
2496
+ "eval_rewards/rejected": -16.1518497467041,
2497
+ "eval_runtime": 97.7492,
2498
+ "eval_samples_per_second": 45.218,
2499
+ "eval_steps_per_second": 2.834,
2500
+ "step": 750
2501
  }
2502
  ],
2503
  "logging_steps": 5,