guyhadad01 commited on
Commit
aab9cfb
·
verified ·
1 Parent(s): ae35f2b

Training in progress, step 27600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1209,6 +1209,10 @@ You can finetune this model on your own dataset.
1209
  | 0.4824 | 27300 | 0.3246 |
1210
  | 0.4833 | 27350 | 0.3131 |
1211
  | 0.4842 | 27400 | 0.3078 |
 
 
 
 
1212
 
1213
 
1214
  ### Framework Versions
 
1209
  | 0.4824 | 27300 | 0.3246 |
1210
  | 0.4833 | 27350 | 0.3131 |
1211
  | 0.4842 | 27400 | 0.3078 |
1212
+ | 0.4851 | 27450 | 0.419 |
1213
+ | 0.4859 | 27500 | 0.3959 |
1214
+ | 0.4868 | 27550 | 0.3754 |
1215
+ | 0.4877 | 27600 | 0.3163 |
1216
 
1217
 
1218
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e42bafc26f64fc942eebe9b36d05cb9ebd690bc7e84350aba5ef5927bebd23aa
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7664a0a0f5ecfa598f2701a1ff37b213f978409532fb7f103898692f18c2a725
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:86493a89e1b924fce58823b6948f096f29423c5ce2b1e2b2de815c28e7f95699
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9a099107f68059125238e954d06fc6e590362c99b51020b9fe7fdd85f6a409e
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1ffba3c8137c0af09582c28fee3245b77ce6875ddb2ff1a79f1003af6257b2b
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e5363905a5180ae7b6dc66d9d24e9725568295ce2578c5fa9423e53d3f4ca3e
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d79db97c4b1cd4a4d432cc88a5b1b07dc74a6838264e86b10e57ab5d0be29f45
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01018da1a415cc4a2591785629b35e825cfe5ca85d564c2b7250cf57ca5ee003
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10c98a9a1e72b7cb62494c74d5b84c2a61b0c8fb7089e16aa24c2bd64d181a5f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52a4e22174e8f57aba7a9808391b59167576034c6b53740dc89da4532411a156
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.4841759290346522,
6
  "eval_steps": 500,
7
- "global_step": 27400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3844,6 +3844,34 @@
3844
  "learning_rate": 2.8667216430072057e-05,
3845
  "loss": 0.3078,
3846
  "step": 27400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3847
  }
3848
  ],
3849
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.48771005990351823,
6
  "eval_steps": 500,
7
+ "global_step": 27600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3844
  "learning_rate": 2.8667216430072057e-05,
3845
  "loss": 0.3078,
3846
  "step": 27400
3847
+ },
3848
+ {
3849
+ "epoch": 0.48505946175186865,
3850
+ "grad_norm": 1.3667497634887695,
3851
+ "learning_rate": 2.8618130411733522e-05,
3852
+ "loss": 0.419,
3853
+ "step": 27450
3854
+ },
3855
+ {
3856
+ "epoch": 0.4859429944690852,
3857
+ "grad_norm": 4.66032075881958,
3858
+ "learning_rate": 2.856904439339499e-05,
3859
+ "loss": 0.3959,
3860
+ "step": 27500
3861
+ },
3862
+ {
3863
+ "epoch": 0.4868265271863017,
3864
+ "grad_norm": 1.530393362045288,
3865
+ "learning_rate": 2.8519958375056448e-05,
3866
+ "loss": 0.3754,
3867
+ "step": 27550
3868
+ },
3869
+ {
3870
+ "epoch": 0.48771005990351823,
3871
+ "grad_norm": 0.9399372935295105,
3872
+ "learning_rate": 2.8470872356717916e-05,
3873
+ "loss": 0.3163,
3874
+ "step": 27600
3875
  }
3876
  ],
3877
  "logging_steps": 50,