guyhadad01 committed on
Commit
eb6dcbc
·
verified ·
1 Parent(s): ace7cc9

Training in progress, step 27800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1213,6 +1213,10 @@ You can finetune this model on your own dataset.
1213
  | 0.4859 | 27500 | 0.3959 |
1214
  | 0.4868 | 27550 | 0.3754 |
1215
  | 0.4877 | 27600 | 0.3163 |
 
 
 
 
1216
 
1217
 
1218
  ### Framework Versions
 
1213
  | 0.4859 | 27500 | 0.3959 |
1214
  | 0.4868 | 27550 | 0.3754 |
1215
  | 0.4877 | 27600 | 0.3163 |
1216
+ | 0.4886 | 27650 | 0.35 |
1217
+ | 0.4895 | 27700 | 0.3397 |
1218
+ | 0.4904 | 27750 | 0.3853 |
1219
+ | 0.4912 | 27800 | 0.2568 |
1220
 
1221
 
1222
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7664a0a0f5ecfa598f2701a1ff37b213f978409532fb7f103898692f18c2a725
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdfacab69b0182b267f66ce210afc2a929861f8a381fcb609abe7250efbad353
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9a099107f68059125238e954d06fc6e590362c99b51020b9fe7fdd85f6a409e
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d101e20d6391c1d00393694ed7c13a8ed5d54b7059e36795228521dd1687fa5d
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e5363905a5180ae7b6dc66d9d24e9725568295ce2578c5fa9423e53d3f4ca3e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6ca64734da2f01bf95a86973d81c98cfbac0699ced506e6f5d14bfc6d5da161
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01018da1a415cc4a2591785629b35e825cfe5ca85d564c2b7250cf57ca5ee003
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e43246be50aae83c1910a5dc4ce6db1d2f843a5836c33c56704984643d301b0e
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52a4e22174e8f57aba7a9808391b59167576034c6b53740dc89da4532411a156
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6ed64f7e529220ff21286b422216dac7ffe45f3b61319d3fedf56a8725ea92a
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.48771005990351823,
6
  "eval_steps": 500,
7
- "global_step": 27600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3872,6 +3872,34 @@
3872
  "learning_rate": 2.8470872356717916e-05,
3873
  "loss": 0.3163,
3874
  "step": 27600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3875
  }
3876
  ],
3877
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.4912441907723843,
6
  "eval_steps": 500,
7
+ "global_step": 27800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3872
  "learning_rate": 2.8470872356717916e-05,
3873
  "loss": 0.3163,
3874
  "step": 27600
3875
+ },
3876
+ {
3877
+ "epoch": 0.48859359262073476,
3878
+ "grad_norm": 1.654520869255066,
3879
+ "learning_rate": 2.8421786338379374e-05,
3880
+ "loss": 0.35,
3881
+ "step": 27650
3882
+ },
3883
+ {
3884
+ "epoch": 0.4894771253379513,
3885
+ "grad_norm": 1.5777958631515503,
3886
+ "learning_rate": 2.8372700320040842e-05,
3887
+ "loss": 0.3397,
3888
+ "step": 27700
3889
+ },
3890
+ {
3891
+ "epoch": 0.49036065805516776,
3892
+ "grad_norm": 1.4474226236343384,
3893
+ "learning_rate": 2.8323614301702307e-05,
3894
+ "loss": 0.3853,
3895
+ "step": 27750
3896
+ },
3897
+ {
3898
+ "epoch": 0.4912441907723843,
3899
+ "grad_norm": 1.603667140007019,
3900
+ "learning_rate": 2.8274528283363765e-05,
3901
+ "loss": 0.2568,
3902
+ "step": 27800
3903
  }
3904
  ],
3905
  "logging_steps": 50,