mgh6 commited on
Commit
8d22e31
·
verified ·
1 Parent(s): 52d5acb

Training in progress, step 4500, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17354674ebfd7ee39e27d2d7c18efe07ba47500bf6960899f0eafdf72eead626
3
  size 136000488
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc8084e5d2f40c117fb67d150045799cf2c3cae6229373318b8bd37a0a605209
3
  size 136000488
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ffd1ca3853498761f71027ee26ab56f29b18b7339583b6e4060a60d4b7e6d35
3
  size 268176506
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4575ef57c4ebf8ade03a543a393b32ae16e5578f529ef3653494f07df3f0f2d
3
  size 268176506
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b88a294175177dc754ff5113f4db5f5889ecf637e68dfb3e98c14246dd8d3714
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f21d552e0b8edeac4b814e68abd63ad5a2fa0f0f0b7c2bf9dd3d572dde4cd39
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70db09ddd19e86007f322d281cc5c5f94909d942e37598ec3ceaa08be20aecba
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b4f9a397f8fb58627464d50119035e3cc721b6c9f0cc18f4836a495d9182e5f
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:598c58dd54a328d92dfc9ab91d559118e55f09ef3e6d1a542d0d2ba34a4f7769
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:736c0a3c5e9cad8a63099122bc81fcfe6c1a1da1f52783fd5ab9a0a79f0525e7
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1529a258db9857087589ba7d21800b6cb787f5ab31dae6d6c97ea8d5a4171643
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:182d0fd1f95f38608a11f6b6579d63e24538540d9ce9b05d123e02020b4a25cf
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49ae85bf7a65e337693025f4ceb61bc3ab49ed353192027ce2cc225b05fa7ea5
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6a126727af8bb09352afcee26a5ce13ba782b7b555b31ebe9b3deaff7994ff9
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.78049236536026,
3
  "best_model_checkpoint": "mgh6/TCS_MLM/checkpoint-4200",
4
- "epoch": 5.890227576974565,
5
  "eval_steps": 100,
6
- "global_step": 4400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -667,6 +667,21 @@
667
  "eval_samples_per_second": 886.234,
668
  "eval_steps_per_second": 3.581,
669
  "step": 4400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
670
  }
671
  ],
672
  "logging_steps": 100,
@@ -681,7 +696,7 @@
681
  "early_stopping_threshold": 0.0
682
  },
683
  "attributes": {
684
- "early_stopping_patience_counter": 2
685
  }
686
  },
687
  "TrainerControl": {
@@ -695,7 +710,7 @@
695
  "attributes": {}
696
  }
697
  },
698
- "total_flos": 1.59773991370752e+17,
699
  "train_batch_size": 64,
700
  "trial_name": null,
701
  "trial_params": null
 
1
  {
2
  "best_metric": 0.78049236536026,
3
  "best_model_checkpoint": "mgh6/TCS_MLM/checkpoint-4200",
4
+ "epoch": 6.024096385542169,
5
  "eval_steps": 100,
6
+ "global_step": 4500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
667
  "eval_samples_per_second": 886.234,
668
  "eval_steps_per_second": 3.581,
669
  "step": 4400
670
+ },
671
+ {
672
+ "epoch": 6.024096385542169,
673
+ "grad_norm": 0.19529978930950165,
674
+ "learning_rate": 0.00039759036144578315,
675
+ "loss": 0.7329,
676
+ "step": 4500
677
+ },
678
+ {
679
+ "epoch": 6.024096385542169,
680
+ "eval_loss": 0.7827839851379395,
681
+ "eval_runtime": 6.3652,
682
+ "eval_samples_per_second": 894.234,
683
+ "eval_steps_per_second": 3.613,
684
+ "step": 4500
685
  }
686
  ],
687
  "logging_steps": 100,
 
696
  "early_stopping_threshold": 0.0
697
  },
698
  "attributes": {
699
+ "early_stopping_patience_counter": 3
700
  }
701
  },
702
  "TrainerControl": {
 
710
  "attributes": {}
711
  }
712
  },
713
+ "total_flos": 1.6340521844736e+17,
714
  "train_batch_size": 64,
715
  "trial_name": null,
716
  "trial_params": null