FormlessAI commited on
Commit
cbae320
·
verified ·
1 Parent(s): 1c1b51a

Training in progress, epoch 7, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49db62516068e315a0097a3075f5d9eed4dabca56b289242354c5050a5096985
3
  size 555780720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86839f7e37cf9db50d92aa3359c8a951b16bcb9bd19179d97785c9380e60d4de
3
  size 555780720
last-checkpoint/global_step1352/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa5f32f83b8dd1abdff17aa4d8a62cf2df4d05afc1f775aa2f6b93598139e4b4
3
+ size 418993765
last-checkpoint/global_step1352/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fc2fc0cd5ce123568d266b89c4f539a173812273213ba02d058dfdf7b623daf
3
+ size 418993829
last-checkpoint/global_step1352/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd31753cbe0128c999d089e0b6ae68cd9dc9534e5009bc8833ba113b6cfc75e4
3
+ size 418993829
last-checkpoint/global_step1352/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a79f62be1ee42d6d4cdaa1d1ae0c25bb27a3f27a7ee18554197caf2fc8ddc5d
3
+ size 418993829
last-checkpoint/global_step1352/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c178a80caac549930759dd5ddeae56a0eebd44125e85347a79d3546d5ea720a
3
+ size 555959385
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step1302
 
1
+ global_step1352
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:091086836d56ce2653ecffb0ae0f470c5a0c8f5e4a0321adebb5dd8b3f287883
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95a3c87bc88363e3f4b77947b12ea79773944af0114a1b604be41b603f0e088e
3
  size 15429
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3875f6c478f16e9290e84b32d47c7894416bef16616ab5dfccda0fa82d7497c4
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:339163084457ee5fe928af6d9e73b4f74db7625bc6e88a289af439ef57976bfb
3
  size 15429
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28580ca8aa74ba18bb130eb4176d6089e133b9d613d7916e228f3be22455fa61
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d12472ec366ee397869b0f92eb4add458e30b5e37a8a371422c324e97a75e38b
3
  size 15429
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7562bb51e5532124c41799cff8e5925d7e80b45c0e9f1a3be4f480ba2d42417
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20f7fa0cdcee712ddbb996fd4afd5bdb4a4fcb884815462037415fce9b45978
3
  size 15429
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d67d662c9022ab09c104c0ce3351b238323049b4af79030deb9d3b09a56fd83b
3
  size 1401
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06ca58d1a0dee9bbca88545d604f59334241351618fe2f019276217fe27d5f25
3
  size 1401
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
  "best_global_step": null,
3
- "best_metric": 0.15382565557956696,
4
  "best_model_checkpoint": null,
5
- "epoch": 7.064996614759648,
6
  "eval_steps": 50,
7
- "global_step": 1300,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4324,6 +4324,172 @@
4324
  "eval_samples_per_second": 44.586,
4325
  "eval_steps_per_second": 2.834,
4326
  "step": 1300
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4327
  }
4328
  ],
4329
  "logging_steps": 5,
 
1
  {
2
  "best_global_step": null,
3
+ "best_metric": 0.13855531811714172,
4
  "best_model_checkpoint": null,
5
+ "epoch": 7.3358158429248475,
6
  "eval_steps": 50,
7
+ "global_step": 1350,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4324
  "eval_samples_per_second": 44.586,
4325
  "eval_steps_per_second": 2.834,
4326
  "step": 1300
4327
+ },
4328
+ {
4329
+ "epoch": 7.0920785375761675,
4330
+ "grad_norm": 0.9328561425209045,
4331
+ "learning_rate": 1.2436575721991239e-05,
4332
+ "logits/chosen": -0.8173828125,
4333
+ "logits/rejected": NaN,
4334
+ "logps/chosen": -368.45001220703125,
4335
+ "logps/rejected": -367.8500061035156,
4336
+ "loss": 0.1569,
4337
+ "rewards/accuracies": 0.9453125,
4338
+ "rewards/chosen": -7.185156345367432,
4339
+ "rewards/margins": 3.2300782203674316,
4340
+ "rewards/rejected": -10.420312881469727,
4341
+ "step": 1305
4342
+ },
4343
+ {
4344
+ "epoch": 7.1191604603926875,
4345
+ "grad_norm": 1.522709608078003,
4346
+ "learning_rate": 1.2432752041311519e-05,
4347
+ "logits/chosen": -0.8003906011581421,
4348
+ "logits/rejected": -0.82373046875,
4349
+ "logps/chosen": -369.20001220703125,
4350
+ "logps/rejected": -381.8999938964844,
4351
+ "loss": 0.1374,
4352
+ "rewards/accuracies": 0.9468749761581421,
4353
+ "rewards/chosen": -6.989062309265137,
4354
+ "rewards/margins": 3.359375,
4355
+ "rewards/rejected": -10.346875190734863,
4356
+ "step": 1310
4357
+ },
4358
+ {
4359
+ "epoch": 7.1462423832092075,
4360
+ "grad_norm": 1.6700057983398438,
4361
+ "learning_rate": 1.2428913301215597e-05,
4362
+ "logits/chosen": NaN,
4363
+ "logits/rejected": -0.8626953363418579,
4364
+ "logps/chosen": -356.04998779296875,
4365
+ "logps/rejected": -373.29998779296875,
4366
+ "loss": 0.1575,
4367
+ "rewards/accuracies": 0.934374988079071,
4368
+ "rewards/chosen": -6.440625190734863,
4369
+ "rewards/margins": 3.438671827316284,
4370
+ "rewards/rejected": -9.872655868530273,
4371
+ "step": 1315
4372
+ },
4373
+ {
4374
+ "epoch": 7.1733243060257275,
4375
+ "grad_norm": 1.6624808311462402,
4376
+ "learning_rate": 1.2425059511367494e-05,
4377
+ "logits/chosen": -0.8272460699081421,
4378
+ "logits/rejected": -0.835644543170929,
4379
+ "logps/chosen": -361.6000061035156,
4380
+ "logps/rejected": -364.6000061035156,
4381
+ "loss": 0.1679,
4382
+ "rewards/accuracies": 0.940625011920929,
4383
+ "rewards/chosen": -6.254687309265137,
4384
+ "rewards/margins": 3.313281297683716,
4385
+ "rewards/rejected": -9.573437690734863,
4386
+ "step": 1320
4387
+ },
4388
+ {
4389
+ "epoch": 7.2004062288422475,
4390
+ "grad_norm": 2.2478160858154297,
4391
+ "learning_rate": 1.2421190681469124e-05,
4392
+ "logits/chosen": -0.782519519329071,
4393
+ "logits/rejected": NaN,
4394
+ "logps/chosen": -355.54998779296875,
4395
+ "logps/rejected": -364.625,
4396
+ "loss": 0.1743,
4397
+ "rewards/accuracies": 0.9437500238418579,
4398
+ "rewards/chosen": -6.853125095367432,
4399
+ "rewards/margins": 2.9222655296325684,
4400
+ "rewards/rejected": -9.770312309265137,
4401
+ "step": 1325
4402
+ },
4403
+ {
4404
+ "epoch": 7.2274881516587675,
4405
+ "grad_norm": 1.1094180345535278,
4406
+ "learning_rate": 1.241730682126026e-05,
4407
+ "logits/chosen": NaN,
4408
+ "logits/rejected": -0.796191394329071,
4409
+ "logps/chosen": -369.8500061035156,
4410
+ "logps/rejected": -372.1000061035156,
4411
+ "loss": 0.1671,
4412
+ "rewards/accuracies": 0.953125,
4413
+ "rewards/chosen": -7.446875095367432,
4414
+ "rewards/margins": 2.931640625,
4415
+ "rewards/rejected": -10.378125190734863,
4416
+ "step": 1330
4417
+ },
4418
+ {
4419
+ "epoch": 7.2545700744752875,
4420
+ "grad_norm": 1.275765299797058,
4421
+ "learning_rate": 1.2413407940518518e-05,
4422
+ "logits/chosen": -0.8089843988418579,
4423
+ "logits/rejected": -0.8099609613418579,
4424
+ "logps/chosen": -370.5,
4425
+ "logps/rejected": -388.04998779296875,
4426
+ "loss": 0.1589,
4427
+ "rewards/accuracies": 0.9453125,
4428
+ "rewards/chosen": -7.414843559265137,
4429
+ "rewards/margins": 3.5,
4430
+ "rewards/rejected": -10.917187690734863,
4431
+ "step": 1335
4432
+ },
4433
+ {
4434
+ "epoch": 7.2816519972918075,
4435
+ "grad_norm": 1.6279685497283936,
4436
+ "learning_rate": 1.2409494049059322e-05,
4437
+ "logits/chosen": NaN,
4438
+ "logits/rejected": -0.7696288824081421,
4439
+ "logps/chosen": -366.95001220703125,
4440
+ "logps/rejected": -403.3500061035156,
4441
+ "loss": 0.1804,
4442
+ "rewards/accuracies": 0.9296875,
4443
+ "rewards/chosen": -7.529687404632568,
4444
+ "rewards/margins": 3.614453077316284,
4445
+ "rewards/rejected": -11.146875381469727,
4446
+ "step": 1340
4447
+ },
4448
+ {
4449
+ "epoch": 7.3087339201083275,
4450
+ "grad_norm": 1.6767570972442627,
4451
+ "learning_rate": 1.2405565156735891e-05,
4452
+ "logits/chosen": -0.6883789300918579,
4453
+ "logits/rejected": -0.69970703125,
4454
+ "logps/chosen": -386.6499938964844,
4455
+ "logps/rejected": -387.95001220703125,
4456
+ "loss": 0.1821,
4457
+ "rewards/accuracies": 0.925000011920929,
4458
+ "rewards/chosen": -7.953906059265137,
4459
+ "rewards/margins": 3.3148436546325684,
4460
+ "rewards/rejected": -11.268750190734863,
4461
+ "step": 1345
4462
+ },
4463
+ {
4464
+ "epoch": 7.3358158429248475,
4465
+ "grad_norm": 1.182672142982483,
4466
+ "learning_rate": 1.2401621273439206e-05,
4467
+ "logits/chosen": -0.683789074420929,
4468
+ "logits/rejected": -0.6509765386581421,
4469
+ "logps/chosen": -375.29998779296875,
4470
+ "logps/rejected": -388.8999938964844,
4471
+ "loss": 0.1432,
4472
+ "rewards/accuracies": 0.949999988079071,
4473
+ "rewards/chosen": -7.917187690734863,
4474
+ "rewards/margins": 3.202343702316284,
4475
+ "rewards/rejected": -11.123437881469727,
4476
+ "step": 1350
4477
+ },
4478
+ {
4479
+ "epoch": 7.3358158429248475,
4480
+ "eval_logits/chosen": -0.6861979365348816,
4481
+ "eval_logits/rejected": NaN,
4482
+ "eval_logps/chosen": -375.1111145019531,
4483
+ "eval_logps/rejected": -389.20001220703125,
4484
+ "eval_loss": 0.13855531811714172,
4485
+ "eval_rewards/accuracies": 0.9513888955116272,
4486
+ "eval_rewards/chosen": -7.346527576446533,
4487
+ "eval_rewards/margins": 3.3333332538604736,
4488
+ "eval_rewards/rejected": -10.679166793823242,
4489
+ "eval_runtime": 15.8625,
4490
+ "eval_samples_per_second": 44.634,
4491
+ "eval_steps_per_second": 2.837,
4492
+ "step": 1350
4493
  }
4494
  ],
4495
  "logging_steps": 5,