goyalayus commited on
Commit
21c8186
·
verified ·
1 Parent(s): 4da99e9

Training in progress, step 60, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91bb60ee728b069aa96221d8ddccb205b6bc74d3bca5226195d5183927e804d3
3
  size 84962944
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:949efa076e0641b1bf7440dda4aab0946a6a70724436d0a3ab83660acc1403a2
3
  size 84962944
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:03f9d860f1e0dbfcdf53555855f9a4471528bf8427d37dfee8a9a003117159ba
3
  size 43387339
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dec3f6f7548b6834b8d8ed0bb9b69af9d9af621c9a1dab11b386eec355c7f0e6
3
  size 43387339
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71a794c77d91f4dc788c1a70f8619fb0ed76a6803da809d3d2d5f646f92481fb
3
  size 14709
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53b3a001f6f9b4c549f0bf73e88f33314cd5b26b892e872aa6828133fc723ff8
3
  size 14709
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7dce57d520a5c903ee4baddf780c2b9cb084140d3e348fde0a802253d3fe502b
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cbdc6c8f1d58fbcd97eca64ad0c1660e5abc38fd1422e1f599bdd89ec16b796
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 55,
3
- "best_metric": 1.7220358848571777,
4
- "best_model_checkpoint": "./outputs/ctrl_abort_right/checkpoint-55",
5
- "epoch": 0.11783610069630424,
6
  "eval_steps": 5,
7
- "global_step": 55,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -481,6 +481,49 @@
481
  "eval_samples_per_second": 14.023,
482
  "eval_steps_per_second": 7.011,
483
  "step": 55
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
484
  }
485
  ],
486
  "logging_steps": 1,
@@ -504,12 +547,12 @@
504
  "should_evaluate": false,
505
  "should_log": false,
506
  "should_save": true,
507
- "should_training_stop": false
508
  },
509
  "attributes": {}
510
  }
511
  },
512
- "total_flos": 5508695710003200.0,
513
  "train_batch_size": 2,
514
  "trial_name": null,
515
  "trial_params": null
 
1
  {
2
+ "best_global_step": 60,
3
+ "best_metric": 1.7189992666244507,
4
+ "best_model_checkpoint": "./outputs/ctrl_abort_right/checkpoint-60",
5
+ "epoch": 0.12854847348687734,
6
  "eval_steps": 5,
7
+ "global_step": 60,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
481
  "eval_samples_per_second": 14.023,
482
  "eval_steps_per_second": 7.011,
483
  "step": 55
484
+ },
485
+ {
486
+ "epoch": 0.11997857525441885,
487
+ "grad_norm": 1.2811716794967651,
488
+ "learning_rate": 2.447174185242324e-07,
489
+ "loss": 1.6783,
490
+ "step": 56
491
+ },
492
+ {
493
+ "epoch": 0.12212104981253348,
494
+ "grad_norm": 1.482115387916565,
495
+ "learning_rate": 1.5708419435684463e-07,
496
+ "loss": 1.8306,
497
+ "step": 57
498
+ },
499
+ {
500
+ "epoch": 0.1242635243706481,
501
+ "grad_norm": 1.1114031076431274,
502
+ "learning_rate": 8.856374635655696e-08,
503
+ "loss": 1.5695,
504
+ "step": 58
505
+ },
506
+ {
507
+ "epoch": 0.12640599892876273,
508
+ "grad_norm": 1.3343108892440796,
509
+ "learning_rate": 3.9426493427611177e-08,
510
+ "loss": 1.6949,
511
+ "step": 59
512
+ },
513
+ {
514
+ "epoch": 0.12854847348687734,
515
+ "grad_norm": 1.162011981010437,
516
+ "learning_rate": 9.866357858642206e-09,
517
+ "loss": 1.5822,
518
+ "step": 60
519
+ },
520
+ {
521
+ "epoch": 0.12854847348687734,
522
+ "eval_loss": 1.7189992666244507,
523
+ "eval_runtime": 1.158,
524
+ "eval_samples_per_second": 13.816,
525
+ "eval_steps_per_second": 6.908,
526
+ "step": 60
527
  }
528
  ],
529
  "logging_steps": 1,
 
547
  "should_evaluate": false,
548
  "should_log": false,
549
  "should_save": true,
550
+ "should_training_stop": true
551
  },
552
  "attributes": {}
553
  }
554
  },
555
+ "total_flos": 6024782336179200.0,
556
  "train_batch_size": 2,
557
  "trial_name": null,
558
  "trial_params": null