guyhadad01 committed on
Commit
d988e26
·
verified ·
1 Parent(s): 728f48d

Training in progress, step 27400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1205,6 +1205,10 @@ You can finetune this model on your own dataset.
1205
  | 0.4789 | 27100 | 0.2753 |
1206
  | 0.4798 | 27150 | 0.35 |
1207
  | 0.4806 | 27200 | 0.3143 |
 
 
 
 
1208
 
1209
 
1210
  ### Framework Versions
 
1205
  | 0.4789 | 27100 | 0.2753 |
1206
  | 0.4798 | 27150 | 0.35 |
1207
  | 0.4806 | 27200 | 0.3143 |
1208
+ | 0.4815 | 27250 | 0.3968 |
1209
+ | 0.4824 | 27300 | 0.3246 |
1210
+ | 0.4833 | 27350 | 0.3131 |
1211
+ | 0.4842 | 27400 | 0.3078 |
1212
 
1213
 
1214
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08045e1f2a8cd2432e9fa2b0ef00df2ac4ced1a000f41148266acaf751aa00fe
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e42bafc26f64fc942eebe9b36d05cb9ebd690bc7e84350aba5ef5927bebd23aa
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91e8be442cecb8de3b11e871dbe4b21251728bce4db99665346a4ae741dd9661
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86493a89e1b924fce58823b6948f096f29423c5ce2b1e2b2de815c28e7f95699
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:527a9946e2b187cf3aeaac98a6c12f5dc108889d1a7d08a9def35306b103680a
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1ffba3c8137c0af09582c28fee3245b77ce6875ddb2ff1a79f1003af6257b2b
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6d84e0b16c16a3884265f119b778a7531d56abad22c7b0d844e8a1a93c8456c
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d79db97c4b1cd4a4d432cc88a5b1b07dc74a6838264e86b10e57ab5d0be29f45
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1ac0dfa5e821d2ce353420d7dc3f3a06dc98c820a2502851855c1f7447269ad
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10c98a9a1e72b7cb62494c74d5b84c2a61b0c8fb7089e16aa24c2bd64d181a5f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.48064179816578606,
6
  "eval_steps": 500,
7
- "global_step": 27200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3816,6 +3816,34 @@
3816
  "learning_rate": 2.8863560503426205e-05,
3817
  "loss": 0.3143,
3818
  "step": 27200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3819
  }
3820
  ],
3821
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.4841759290346522,
6
  "eval_steps": 500,
7
+ "global_step": 27400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3816
  "learning_rate": 2.8863560503426205e-05,
3817
  "loss": 0.3143,
3818
  "step": 27200
3819
+ },
3820
+ {
3821
+ "epoch": 0.4815253308830026,
3822
+ "grad_norm": 1.6409038305282593,
3823
+ "learning_rate": 2.8814474485087667e-05,
3824
+ "loss": 0.3968,
3825
+ "step": 27250
3826
+ },
3827
+ {
3828
+ "epoch": 0.4824088636002191,
3829
+ "grad_norm": 1.4830607175827026,
3830
+ "learning_rate": 2.876538846674913e-05,
3831
+ "loss": 0.3246,
3832
+ "step": 27300
3833
+ },
3834
+ {
3835
+ "epoch": 0.48329239631743565,
3836
+ "grad_norm": 1.6359367370605469,
3837
+ "learning_rate": 2.87163024484106e-05,
3838
+ "loss": 0.3131,
3839
+ "step": 27350
3840
+ },
3841
+ {
3842
+ "epoch": 0.4841759290346522,
3843
+ "grad_norm": 1.1834681034088135,
3844
+ "learning_rate": 2.8667216430072057e-05,
3845
+ "loss": 0.3078,
3846
+ "step": 27400
3847
  }
3848
  ],
3849
  "logging_steps": 50,