Reggie commited on
Commit
20996dd
·
verified ·
1 Parent(s): 39da7ec

Training in progress, step 2400, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a227244b79f305f140948c1079fcdc545f071391bb7e4ff9cf542a898d157d1c
3
  size 69782384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e881eea67951f715a0412c658550fa6656f80eb9c2e7babf1715b545a2d6c453
3
  size 69782384
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9e0d7d55f9a230dad78340581c7686c5db109d5d23cb37fd0af07013b1770c4
3
  size 139790651
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d4dbaa4a93c925e7206f796b1b5cb1d4f8097fcd0cada8da8eca9fa94e98a40
3
  size 139790651
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:92bebe68c4903b16edae13a87b639062f86297d20f12bfc3a43205a7d64356a6
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a29859d5dfe7ec5553a7575bdf1fff1111c940a25116f4b3204c18d1ea7bcdb7
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42a9c19735c8da4979dd9d9844a70622260a91c03b4b752eeed5aefa51d6bbfb
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ebdfd2092dbf93cc1de964feb5cc7ccb4c109e2c86de6e8d8008013b0ca48f9
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 1800,
3
  "best_metric": 2.1885855197906494,
4
  "best_model_checkpoint": "./outputs/checkpoint-1800",
5
- "epoch": 2.3887079261672097,
6
  "eval_steps": 200,
7
- "global_step": 2200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -404,6 +404,42 @@
404
  "eval_samples_per_second": 81.956,
405
  "eval_steps_per_second": 2.587,
406
  "step": 2200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
407
  }
408
  ],
409
  "logging_steps": 50,
@@ -418,7 +454,7 @@
418
  "early_stopping_threshold": 0.0
419
  },
420
  "attributes": {
421
- "early_stopping_patience_counter": 2
422
  }
423
  },
424
  "TrainerControl": {
@@ -427,12 +463,12 @@
427
  "should_evaluate": false,
428
  "should_log": false,
429
  "should_save": true,
430
- "should_training_stop": false
431
  },
432
  "attributes": {}
433
  }
434
  },
435
- "total_flos": 6.162730083190702e+17,
436
  "train_batch_size": 32,
437
  "trial_name": null,
438
  "trial_params": null
 
2
  "best_global_step": 1800,
3
  "best_metric": 2.1885855197906494,
4
  "best_model_checkpoint": "./outputs/checkpoint-1800",
5
+ "epoch": 2.6058631921824107,
6
  "eval_steps": 200,
7
+ "global_step": 2400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
404
  "eval_samples_per_second": 81.956,
405
  "eval_steps_per_second": 2.587,
406
  "step": 2200
407
+ },
408
+ {
409
+ "epoch": 2.44299674267101,
410
+ "grad_norm": 1.4523568153381348,
411
+ "learning_rate": 1.7196383108428315e-05,
412
+ "loss": 2.1359,
413
+ "step": 2250
414
+ },
415
+ {
416
+ "epoch": 2.49728555917481,
417
+ "grad_norm": 1.3263523578643799,
418
+ "learning_rate": 1.4090705132619631e-05,
419
+ "loss": 2.1206,
420
+ "step": 2300
421
+ },
422
+ {
423
+ "epoch": 2.5515743756786105,
424
+ "grad_norm": 1.4148005247116089,
425
+ "learning_rate": 1.1272938645118803e-05,
426
+ "loss": 2.1314,
427
+ "step": 2350
428
+ },
429
+ {
430
+ "epoch": 2.6058631921824107,
431
+ "grad_norm": 1.9476280212402344,
432
+ "learning_rate": 8.752526947077045e-06,
433
+ "loss": 2.1254,
434
+ "step": 2400
435
+ },
436
+ {
437
+ "epoch": 2.6058631921824107,
438
+ "eval_loss": 2.189617395401001,
439
+ "eval_runtime": 7.3524,
440
+ "eval_samples_per_second": 81.878,
441
+ "eval_steps_per_second": 2.584,
442
+ "step": 2400
443
  }
444
  ],
445
  "logging_steps": 50,
 
454
  "early_stopping_threshold": 0.0
455
  },
456
  "attributes": {
457
+ "early_stopping_patience_counter": 3
458
  }
459
  },
460
  "TrainerControl": {
 
463
  "should_evaluate": false,
464
  "should_log": false,
465
  "should_save": true,
466
+ "should_training_stop": true
467
  },
468
  "attributes": {}
469
  }
470
  },
471
+ "total_flos": 6.723721683521372e+17,
472
  "train_batch_size": 32,
473
  "trial_name": null,
474
  "trial_params": null