guyhadad01 committed on
Commit
22413ba
·
verified ·
1 Parent(s): 0a5413a

Training in progress, step 4600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -286,9 +286,9 @@ print(embeddings.shape)
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
- # tensor([[1.0000, 0.5709, 0.1243],
290
- # [0.5709, 1.0000, 0.1388],
291
- # [0.1243, 0.1388, 1.0000]])
292
  ```
293
 
294
  <!--
@@ -1312,6 +1312,10 @@ You can finetune this model on your own dataset.
1312
  | 0.0760 | 4300 | 0.4779 |
1313
  | 0.0769 | 4350 | 0.4463 |
1314
  | 0.0778 | 4400 | 0.4917 |
 
 
 
 
1315
 
1316
 
1317
  ### Framework Versions
 
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
+ # tensor([[1.0000, 0.6246, 0.1173],
290
+ # [0.6246, 1.0000, 0.1638],
291
+ # [0.1173, 0.1638, 1.0000]])
292
  ```
293
 
294
  <!--
 
1312
  | 0.0760 | 4300 | 0.4779 |
1313
  | 0.0769 | 4350 | 0.4463 |
1314
  | 0.0778 | 4400 | 0.4917 |
1315
+ | 0.0786 | 4450 | 0.5572 |
1316
+ | 0.0795 | 4500 | 0.4553 |
1317
+ | 0.0804 | 4550 | 0.4598 |
1318
+ | 0.0813 | 4600 | 0.5445 |
1319
 
1320
 
1321
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28ab5af774c8b92f73b8b0edbc8679fe71ea4dfe39546414176fa364cb641370
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8de4e67c75f4b4a7427b2810b985973120199b61a5e131a31184941440675588
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f00d4b90b013eb15ec92f6d8f7effe9c310c62760f7a18e7788ea316eefca59
3
  size 180609611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a2de7647e7106c94dd0498982cecf5e23bcd6cc4a2d106abd4e0a67ed761131
3
  size 180609611
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb2a47368e57ccb8578c1be62d33027ebea1fe6bd63bffa18038620abaa273d0
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0c125bd90db08e6be99cb0172e0d523e9ccee0b8234c431ef93a30e9252f3b6
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa01c0faab1a39c11ceba075e1e73b81a5689cfd1ac0d27ee7fece150d320be6
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d5f1d0b668240e318afe61a3e255204044d52e6d78b98d08469e3aaa3293711
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02cdb9f646b45dd98fa4d4f96eec0334a5b44f90a00b9690154aab22c0f05613
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c485dc831eee1163015670289f311918797d3da6236e5f584fb1d2dbee1714b9
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.07775087911505363,
6
  "eval_steps": 500,
7
- "global_step": 4400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -624,6 +624,34 @@
624
  "learning_rate": 3.8860424028268556e-05,
625
  "loss": 0.4917,
626
  "step": 4400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
627
  }
628
  ],
629
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.0812850099839197,
6
  "eval_steps": 500,
7
+ "global_step": 4600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
624
  "learning_rate": 3.8860424028268556e-05,
625
  "loss": 0.4917,
626
  "step": 4400
627
+ },
628
+ {
629
+ "epoch": 0.07863441183227014,
630
+ "grad_norm": 5.889612197875977,
631
+ "learning_rate": 3.930212014134276e-05,
632
+ "loss": 0.5572,
633
+ "step": 4450
634
+ },
635
+ {
636
+ "epoch": 0.07951794454948667,
637
+ "grad_norm": 2.7529609203338623,
638
+ "learning_rate": 3.9743816254416965e-05,
639
+ "loss": 0.4553,
640
+ "step": 4500
641
+ },
642
+ {
643
+ "epoch": 0.08040147726670319,
644
+ "grad_norm": 2.4175944328308105,
645
+ "learning_rate": 4.018551236749117e-05,
646
+ "loss": 0.4598,
647
+ "step": 4550
648
+ },
649
+ {
650
+ "epoch": 0.0812850099839197,
651
+ "grad_norm": 2.2330217361450195,
652
+ "learning_rate": 4.0627208480565374e-05,
653
+ "loss": 0.5445,
654
+ "step": 4600
655
  }
656
  ],
657
  "logging_steps": 50,