PhoenixB committed on
Commit
fffda03
·
verified ·
1 Parent(s): 94ccb17

Training in progress, step 30, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a26a2ff6112a076b5c8539d9ff44f6eaf49e13976e20d6dc004a8a4895aea5e
3
  size 30322120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a635d848d65f59777d485a4cee215eb528eaa458d65014bfd03ab9b8a4b46333
3
  size 30322120
last-checkpoint/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24c8b131cdf809e3bf8e8086ded78bd8082c724112b6b1d3e448f2d873c67bef
3
  size 60854466
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a69bcec7cb99fe2ec8bcacaec1905a1f4eae223090e818b34a18929c6a587604
3
  size 60854466
last-checkpoint/pytorch_model_fsdp.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ca652a881740fc7aa9fa81865c0e8757bd9580b658c87c8125e22e6bfdcaf17
3
  size 30402542
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8f6c735f4230b47f7793f3c236777cea263c2c684b8e532e86f150fc0afc335
3
  size 30402542
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:015707cb16790250630febca682498cb5d3456d5a13443b953687f19dc7d59ed
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2def2cd24154d8cecbaa07c36ae27e5ebb9b7273a78abfea27aa67c480e4ae2b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.008229606007612385,
5
  "eval_steps": 500,
6
- "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -307,6 +307,156 @@
307
  "rewards/margins": 9.52292537689209,
308
  "rewards/rejected": -10.617974281311035,
309
  "step": 20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
310
  }
311
  ],
312
  "logging_steps": 1,
@@ -321,7 +471,7 @@
321
  "should_evaluate": false,
322
  "should_log": false,
323
  "should_save": true,
324
- "should_training_stop": false
325
  },
326
  "attributes": {}
327
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.012344409011418579,
5
  "eval_steps": 500,
6
+ "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
307
  "rewards/margins": 9.52292537689209,
308
  "rewards/rejected": -10.617974281311035,
309
  "step": 20
310
+ },
311
+ {
312
+ "epoch": 0.008641086307993005,
313
+ "grad_norm": 1.421184778213501,
314
+ "learning_rate": 5.7422070843492734e-05,
315
+ "logits/chosen": -1.2648671865463257,
316
+ "logits/rejected": -1.159667730331421,
317
+ "logps/chosen": -388.2962341308594,
318
+ "logps/rejected": -428.2628479003906,
319
+ "loss": 0.01,
320
+ "rewards/accuracies": 1.0,
321
+ "rewards/chosen": -0.8064693808555603,
322
+ "rewards/margins": 9.668671607971191,
323
+ "rewards/rejected": -10.475141525268555,
324
+ "step": 21
325
+ },
326
+ {
327
+ "epoch": 0.009052566608373624,
328
+ "grad_norm": 0.7935642004013062,
329
+ "learning_rate": 4.6417320502100316e-05,
330
+ "logits/chosen": -1.5795066356658936,
331
+ "logits/rejected": -1.5574439764022827,
332
+ "logps/chosen": -673.1815185546875,
333
+ "logps/rejected": -578.0742797851562,
334
+ "loss": 0.0042,
335
+ "rewards/accuracies": 1.0,
336
+ "rewards/chosen": -1.4215660095214844,
337
+ "rewards/margins": 10.199383735656738,
338
+ "rewards/rejected": -11.620948791503906,
339
+ "step": 22
340
+ },
341
+ {
342
+ "epoch": 0.009464046908754244,
343
+ "grad_norm": 0.5888037085533142,
344
+ "learning_rate": 3.6257601025131026e-05,
345
+ "logits/chosen": -1.356429934501648,
346
+ "logits/rejected": -0.7343645095825195,
347
+ "logps/chosen": -558.6991577148438,
348
+ "logps/rejected": -601.5557861328125,
349
+ "loss": 0.0033,
350
+ "rewards/accuracies": 1.0,
351
+ "rewards/chosen": -0.7459613680839539,
352
+ "rewards/margins": 7.877223968505859,
353
+ "rewards/rejected": -8.623186111450195,
354
+ "step": 23
355
+ },
356
+ {
357
+ "epoch": 0.009875527209134862,
358
+ "grad_norm": 1.5047943592071533,
359
+ "learning_rate": 2.7103137257858868e-05,
360
+ "logits/chosen": -1.4022102355957031,
361
+ "logits/rejected": -1.2865889072418213,
362
+ "logps/chosen": -505.72802734375,
363
+ "logps/rejected": -496.80517578125,
364
+ "loss": 0.0069,
365
+ "rewards/accuracies": 1.0,
366
+ "rewards/chosen": -0.9657745361328125,
367
+ "rewards/margins": 9.834795951843262,
368
+ "rewards/rejected": -10.800569534301758,
369
+ "step": 24
370
+ },
371
+ {
372
+ "epoch": 0.010287007509515483,
373
+ "grad_norm": 10.904205322265625,
374
+ "learning_rate": 1.9098300562505266e-05,
375
+ "logits/chosen": -1.3055310249328613,
376
+ "logits/rejected": -1.1012433767318726,
377
+ "logps/chosen": -544.568115234375,
378
+ "logps/rejected": -463.7269592285156,
379
+ "loss": 0.0883,
380
+ "rewards/accuracies": 0.875,
381
+ "rewards/chosen": -1.7714694738388062,
382
+ "rewards/margins": 10.789080619812012,
383
+ "rewards/rejected": -12.560550689697266,
384
+ "step": 25
385
+ },
386
+ {
387
+ "epoch": 0.010698487809896101,
388
+ "grad_norm": 3.510283946990967,
389
+ "learning_rate": 1.2369331995613665e-05,
390
+ "logits/chosen": -1.4968920946121216,
391
+ "logits/rejected": -1.4846692085266113,
392
+ "logps/chosen": -702.6878051757812,
393
+ "logps/rejected": -574.542236328125,
394
+ "loss": 0.0342,
395
+ "rewards/accuracies": 1.0,
396
+ "rewards/chosen": 0.20018263161182404,
397
+ "rewards/margins": 13.992487907409668,
398
+ "rewards/rejected": -13.792304992675781,
399
+ "step": 26
400
+ },
401
+ {
402
+ "epoch": 0.011109968110276721,
403
+ "grad_norm": 1.6500478982925415,
404
+ "learning_rate": 7.022351411174866e-06,
405
+ "logits/chosen": -1.2855603694915771,
406
+ "logits/rejected": -0.9878661632537842,
407
+ "logps/chosen": -484.6141662597656,
408
+ "logps/rejected": -587.2501831054688,
409
+ "loss": 0.0106,
410
+ "rewards/accuracies": 1.0,
411
+ "rewards/chosen": 0.0036479830741882324,
412
+ "rewards/margins": 11.438243865966797,
413
+ "rewards/rejected": -11.434595108032227,
414
+ "step": 27
415
+ },
416
+ {
417
+ "epoch": 0.01152144841065734,
418
+ "grad_norm": 0.5148972868919373,
419
+ "learning_rate": 3.1416838871368924e-06,
420
+ "logits/chosen": -1.3569444417953491,
421
+ "logits/rejected": -1.2854053974151611,
422
+ "logps/chosen": -412.2033996582031,
423
+ "logps/rejected": -440.2686767578125,
424
+ "loss": 0.0021,
425
+ "rewards/accuracies": 1.0,
426
+ "rewards/chosen": -0.6896465420722961,
427
+ "rewards/margins": 11.664054870605469,
428
+ "rewards/rejected": -12.3537015914917,
429
+ "step": 28
430
+ },
431
+ {
432
+ "epoch": 0.011932928711037958,
433
+ "grad_norm": 1.212573766708374,
434
+ "learning_rate": 7.885298685522235e-07,
435
+ "logits/chosen": -1.547814965248108,
436
+ "logits/rejected": -1.5019885301589966,
437
+ "logps/chosen": -630.9375,
438
+ "logps/rejected": -641.284423828125,
439
+ "loss": 0.0056,
440
+ "rewards/accuracies": 1.0,
441
+ "rewards/chosen": -0.26978832483291626,
442
+ "rewards/margins": 12.407413482666016,
443
+ "rewards/rejected": -12.677202224731445,
444
+ "step": 29
445
+ },
446
+ {
447
+ "epoch": 0.012344409011418579,
448
+ "grad_norm": 1.2990347146987915,
449
+ "learning_rate": 0.0,
450
+ "logits/chosen": -1.6665741205215454,
451
+ "logits/rejected": -1.70499849319458,
452
+ "logps/chosen": -732.9165649414062,
453
+ "logps/rejected": -663.5682983398438,
454
+ "loss": 0.0058,
455
+ "rewards/accuracies": 1.0,
456
+ "rewards/chosen": -0.8148876428604126,
457
+ "rewards/margins": 12.031583786010742,
458
+ "rewards/rejected": -12.846470832824707,
459
+ "step": 30
460
  }
461
  ],
462
  "logging_steps": 1,
 
471
  "should_evaluate": false,
472
  "should_log": false,
473
  "should_save": true,
474
+ "should_training_stop": true
475
  },
476
  "attributes": {}
477
  }