guyhadad01 committed on
Commit
6ebe74e
·
verified ·
1 Parent(s): 0c691bf

Training in progress, step 800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -466,9 +466,9 @@ print(embeddings.shape)
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
- # tensor([[ 1.0000, 0.5416, -0.0529],
470
- # [ 0.5416, 1.0000, -0.0571],
471
- # [-0.0529, -0.0571, 1.0000]])
472
  ```
473
 
474
  <!--
@@ -688,6 +688,10 @@ You can finetune this model on your own dataset.
688
  | 0.2541 | 500 | 0.5257 |
689
  | 0.2795 | 550 | 0.5151 |
690
  | 0.3049 | 600 | 0.5239 |
 
 
 
 
691
 
692
 
693
  ### Framework Versions
 
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
+ # tensor([[ 1.0000, 0.5419, -0.0536],
470
+ # [ 0.5419, 1.0000, -0.0603],
471
+ # [-0.0536, -0.0603, 1.0000]])
472
  ```
473
 
474
  <!--
 
688
  | 0.2541 | 500 | 0.5257 |
689
  | 0.2795 | 550 | 0.5151 |
690
  | 0.3049 | 600 | 0.5239 |
691
+ | 0.3303 | 650 | 0.5169 |
692
+ | 0.3557 | 700 | 0.4942 |
693
+ | 0.3811 | 750 | 0.4981 |
694
+ | 0.4065 | 800 | 0.4983 |
695
 
696
 
697
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db180de14ad34af5b594eb81db91a48a3f45d6d9dcd3f719d2c809d54b9b71a5
3
  size 45437864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c83389a56acb41d0a1917c61a6404affa2f39e3aea8c2d79163946b220cb15ea
3
  size 45437864
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e101e09cac9abb18af92e11a5aad1671259c0532e03955910cff367b721b16d8
3
  size 90346763
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7c5ce4a9c10d4eddde5fcecaa6f889d2244e95913f07ab978ddb77e2cd0092b
3
  size 90346763
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ee89ff3a386fc330c8001091c3d124cf617c5bfb2fe56bc351034ede547ca47
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f142a1fe70eca00a55d0386edee20a5cc0cc4371069ed8cc8489431723b0160c
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7eb57b4b6586ca069ba10818f8421f503ffe2fcc4027df0b3bf8a2421cac2a7
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79cf700515bb029e36ca46412b96b02750cd1dce66cb44278ee1c691b7d1aa79
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.3048780487804878,
6
  "eval_steps": 500,
7
- "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -92,6 +92,34 @@
92
  "learning_rate": 3.8650479954827784e-05,
93
  "loss": 0.5239,
94
  "step": 600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
95
  }
96
  ],
97
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.4065040650406504,
6
  "eval_steps": 500,
7
+ "global_step": 800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
92
  "learning_rate": 3.8650479954827784e-05,
93
  "loss": 0.5239,
94
  "step": 600
95
+ },
96
+ {
97
+ "epoch": 0.33028455284552843,
98
+ "grad_norm": 1.8828125,
99
+ "learning_rate": 3.7238848108413324e-05,
100
+ "loss": 0.5169,
101
+ "step": 650
102
+ },
103
+ {
104
+ "epoch": 0.3556910569105691,
105
+ "grad_norm": 1.8359375,
106
+ "learning_rate": 3.5827216261998877e-05,
107
+ "loss": 0.4942,
108
+ "step": 700
109
+ },
110
+ {
111
+ "epoch": 0.38109756097560976,
112
+ "grad_norm": 1.9921875,
113
+ "learning_rate": 3.4415584415584416e-05,
114
+ "loss": 0.4981,
115
+ "step": 750
116
+ },
117
+ {
118
+ "epoch": 0.4065040650406504,
119
+ "grad_norm": 1.7578125,
120
+ "learning_rate": 3.300395256916996e-05,
121
+ "loss": 0.4983,
122
+ "step": 800
123
  }
124
  ],
125
  "logging_steps": 50,