guyhadad01 committed on
Commit
f184216
·
verified ·
1 Parent(s): add4b48

Training in progress, step 1600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -466,9 +466,9 @@ print(embeddings.shape)
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
- # tensor([[ 1.0000, 0.5480, -0.0458],
470
- # [ 0.5480, 1.0000, -0.0586],
471
- # [-0.0458, -0.0586, 1.0000]])
472
  ```
473
 
474
  <!--
@@ -704,6 +704,10 @@ You can finetune this model on your own dataset.
704
  | 0.6606 | 1300 | 0.4868 |
705
  | 0.6860 | 1350 | 0.4819 |
706
  | 0.7114 | 1400 | 0.486 |
 
 
 
 
707
 
708
 
709
  ### Framework Versions
 
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
+ # tensor([[ 1.0000, 0.5466, -0.0451],
470
+ # [ 0.5466, 1.0000, -0.0569],
471
+ # [-0.0451, -0.0569, 1.0000]])
472
  ```
473
 
474
  <!--
 
704
  | 0.6606 | 1300 | 0.4868 |
705
  | 0.6860 | 1350 | 0.4819 |
706
  | 0.7114 | 1400 | 0.486 |
707
+ | 0.7368 | 1450 | 0.4875 |
708
+ | 0.7622 | 1500 | 0.4874 |
709
+ | 0.7876 | 1550 | 0.4725 |
710
+ | 0.8130 | 1600 | 0.4819 |
711
 
712
 
713
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75920a4e97e5b78b8f2aef96fae35a0db4f205a5343091523547609bce4b1d9f
3
  size 45437864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:854754df8ec84609cad82f36d53d753aec51ba9c534b5f7b71a1982a04c1c64d
3
  size 45437864
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e095a8f770b2b09aeb0a9f8fb5ddd7dac988fa28d75f73b4e4ef2b0581b1b05
3
  size 90346763
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bcd768d6c419625a038d8e3c0adb38c0af2ee7c4104d330447beecd4087778b
3
  size 90346763
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7e4625f78173d74ff3d9f6deda2944ea87976ad1f424f0e59922e3adcae27fc
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f849d8544efef0e1ff23cfbc0ca401c847e9bbacee1179c6d68fa07318aa06b4
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0299032156c99cc748a49daedbaed704010a8fef256e5ec9b90ef95f2e77d9cd
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ac15faca44126ea757af3cc9233a4970a99a30bf6b2f36cfb0d4ae9816273ed
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7113821138211383,
6
  "eval_steps": 500,
7
- "global_step": 1400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -204,6 +204,34 @@
204
  "learning_rate": 1.60643704121965e-05,
205
  "loss": 0.486,
206
  "step": 1400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
207
  }
208
  ],
209
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.8130081300813008,
6
  "eval_steps": 500,
7
+ "global_step": 1600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
204
  "learning_rate": 1.60643704121965e-05,
205
  "loss": 0.486,
206
  "step": 1400
207
+ },
208
+ {
209
+ "epoch": 0.7367886178861789,
210
+ "grad_norm": 1.7265625,
211
+ "learning_rate": 1.4652738565782046e-05,
212
+ "loss": 0.4875,
213
+ "step": 1450
214
+ },
215
+ {
216
+ "epoch": 0.7621951219512195,
217
+ "grad_norm": 1.9921875,
218
+ "learning_rate": 1.3241106719367592e-05,
219
+ "loss": 0.4874,
220
+ "step": 1500
221
+ },
222
+ {
223
+ "epoch": 0.7876016260162602,
224
+ "grad_norm": 1.796875,
225
+ "learning_rate": 1.1829474872953134e-05,
226
+ "loss": 0.4725,
227
+ "step": 1550
228
+ },
229
+ {
230
+ "epoch": 0.8130081300813008,
231
+ "grad_norm": 1.8359375,
232
+ "learning_rate": 1.0417843026538679e-05,
233
+ "loss": 0.4819,
234
+ "step": 1600
235
  }
236
  ],
237
  "logging_steps": 50,