guyhadad01 committed on
Commit
d636c17
·
verified ·
1 Parent(s): f40fcde

Training in progress, step 4400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -286,9 +286,9 @@ print(embeddings.shape)
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
- # tensor([[1.0000, 0.6197, 0.0899],
290
- # [0.6197, 1.0000, 0.1018],
291
- # [0.0899, 0.1018, 1.0000]])
292
  ```
293
 
294
  <!--
@@ -1308,6 +1308,10 @@ You can finetune this model on your own dataset.
1308
  | 0.0724 | 4100 | 0.4755 |
1309
  | 0.0733 | 4150 | 0.4897 |
1310
  | 0.0742 | 4200 | 0.4679 |
 
 
 
 
1311
 
1312
 
1313
  ### Framework Versions
 
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
+ # tensor([[1.0000, 0.5709, 0.1243],
290
+ # [0.5709, 1.0000, 0.1388],
291
+ # [0.1243, 0.1388, 1.0000]])
292
  ```
293
 
294
  <!--
 
1308
  | 0.0724 | 4100 | 0.4755 |
1309
  | 0.0733 | 4150 | 0.4897 |
1310
  | 0.0742 | 4200 | 0.4679 |
1311
+ | 0.0751 | 4250 | 0.4712 |
1312
+ | 0.0760 | 4300 | 0.4779 |
1313
+ | 0.0769 | 4350 | 0.4463 |
1314
+ | 0.0778 | 4400 | 0.4917 |
1315
 
1316
 
1317
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6edbab9b964e9ca7b0bab9e7c4f66e7e7bc86ba965571aa4d27edf17e6ee9ae
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28ab5af774c8b92f73b8b0edbc8679fe71ea4dfe39546414176fa364cb641370
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49ef51099777f465890db4e01e4666b0ea051323d10a6459c3da580d7d661a3c
3
  size 180609611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f00d4b90b013eb15ec92f6d8f7effe9c310c62760f7a18e7788ea316eefca59
3
  size 180609611
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6b1fbe40a2f2e085bd8df80fdc83132b78dd273708a845bf0221a8bf75df21c
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb2a47368e57ccb8578c1be62d33027ebea1fe6bd63bffa18038620abaa273d0
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0563f0c122c10b3bb9fb8ef7a029cf4fe15b88c3307945ff50155d3485ee7edd
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa01c0faab1a39c11ceba075e1e73b81a5689cfd1ac0d27ee7fece150d320be6
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77c82cc641eba2e585eb912c19a748e90231d19cc7c5365b3984d32e47cc490a
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02cdb9f646b45dd98fa4d4f96eec0334a5b44f90a00b9690154aab22c0f05613
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.07421674824618756,
6
  "eval_steps": 500,
7
- "global_step": 4200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -596,6 +596,34 @@
596
  "learning_rate": 3.709363957597173e-05,
597
  "loss": 0.4679,
598
  "step": 4200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
599
  }
600
  ],
601
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.07775087911505363,
6
  "eval_steps": 500,
7
+ "global_step": 4400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
596
  "learning_rate": 3.709363957597173e-05,
597
  "loss": 0.4679,
598
  "step": 4200
599
+ },
600
+ {
601
+ "epoch": 0.07510028096340407,
602
+ "grad_norm": 2.700162649154663,
603
+ "learning_rate": 3.7535335689045936e-05,
604
+ "loss": 0.4712,
605
+ "step": 4250
606
+ },
607
+ {
608
+ "epoch": 0.0759838136806206,
609
+ "grad_norm": 1.9648590087890625,
610
+ "learning_rate": 3.797703180212015e-05,
611
+ "loss": 0.4779,
612
+ "step": 4300
613
+ },
614
+ {
615
+ "epoch": 0.07686734639783711,
616
+ "grad_norm": 2.4238970279693604,
617
+ "learning_rate": 3.8418727915194345e-05,
618
+ "loss": 0.4463,
619
+ "step": 4350
620
+ },
621
+ {
622
+ "epoch": 0.07775087911505363,
623
+ "grad_norm": 1.745356798171997,
624
+ "learning_rate": 3.8860424028268556e-05,
625
+ "loss": 0.4917,
626
+ "step": 4400
627
  }
628
  ],
629
  "logging_steps": 50,