guyhadad01 committed on
Commit
6be46e8
·
verified ·
1 Parent(s): c85c93b

Training in progress, step 600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -466,9 +466,9 @@ print(embeddings.shape)
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
- # tensor([[ 1.0000, 0.5340, -0.0489],
470
- # [ 0.5340, 1.0000, -0.0623],
471
- # [-0.0489, -0.0623, 1.0000]])
472
  ```
473
 
474
  <!--
@@ -684,6 +684,10 @@ You can finetune this model on your own dataset.
684
  | 0.1524 | 300 | 0.5898 |
685
  | 0.1778 | 350 | 0.5569 |
686
  | 0.2033 | 400 | 0.5396 |
 
 
 
 
687
 
688
 
689
  ### Framework Versions
 
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
+ # tensor([[ 1.0000, 0.5416, -0.0529],
470
+ # [ 0.5416, 1.0000, -0.0571],
471
+ # [-0.0529, -0.0571, 1.0000]])
472
  ```
473
 
474
  <!--
 
684
  | 0.1524 | 300 | 0.5898 |
685
  | 0.1778 | 350 | 0.5569 |
686
  | 0.2033 | 400 | 0.5396 |
687
+ | 0.2287 | 450 | 0.5298 |
688
+ | 0.2541 | 500 | 0.5257 |
689
+ | 0.2795 | 550 | 0.5151 |
690
+ | 0.3049 | 600 | 0.5239 |
691
 
692
 
693
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ebaadd7ca69549d21e0a9b5a198c58e5df0a12a58aa56635196f10c545d2363b
3
  size 45437864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db180de14ad34af5b594eb81db91a48a3f45d6d9dcd3f719d2c809d54b9b71a5
3
  size 45437864
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8a26a7a0f56cd6950e1e3ae0ec3c0412ad0bcebd9c3dfa88f2162b4a3e97528
3
  size 90346763
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e101e09cac9abb18af92e11a5aad1671259c0532e03955910cff367b721b16d8
3
  size 90346763
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4865ec8a72ed85ad9518ab1ebb67049ddc164edcb9400bda4e9e54f2cabcece1
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ee89ff3a386fc330c8001091c3d124cf617c5bfb2fe56bc351034ede547ca47
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8fc56140e5c37825482a26f377f07f74eaa4028a1b2f8b46eaa880f0215c9abf
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7eb57b4b6586ca069ba10818f8421f503ffe2fcc4027df0b3bf8a2421cac2a7
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.2032520325203252,
6
  "eval_steps": 500,
7
- "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -64,6 +64,34 @@
64
  "learning_rate": 4.42970073404856e-05,
65
  "loss": 0.5396,
66
  "step": 400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
67
  }
68
  ],
69
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.3048780487804878,
6
  "eval_steps": 500,
7
+ "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
64
  "learning_rate": 4.42970073404856e-05,
65
  "loss": 0.5396,
66
  "step": 400
67
+ },
68
+ {
69
+ "epoch": 0.22865853658536586,
70
+ "grad_norm": 1.796875,
71
+ "learning_rate": 4.288537549407115e-05,
72
+ "loss": 0.5298,
73
+ "step": 450
74
+ },
75
+ {
76
+ "epoch": 0.2540650406504065,
77
+ "grad_norm": 1.859375,
78
+ "learning_rate": 4.147374364765669e-05,
79
+ "loss": 0.5257,
80
+ "step": 500
81
+ },
82
+ {
83
+ "epoch": 0.27947154471544716,
84
+ "grad_norm": 1.84375,
85
+ "learning_rate": 4.006211180124224e-05,
86
+ "loss": 0.5151,
87
+ "step": 550
88
+ },
89
+ {
90
+ "epoch": 0.3048780487804878,
91
+ "grad_norm": 1.828125,
92
+ "learning_rate": 3.8650479954827784e-05,
93
+ "loss": 0.5239,
94
+ "step": 600
95
  }
96
  ],
97
  "logging_steps": 50,