guyhadad01 committed on
Commit
caf19fa
·
verified ·
1 Parent(s): 86dbd8a

Training in progress, step 1200, checkpoint

Browse files
last-checkpoint/2_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b6c776b093b837b0cfe9d25fef404f3dee032b8cafb171d812cfd30cd885e3b
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a2189eb62627bdac98795adf703b4963d7bb5806a18140f0705bd0846bdcb81
3
  size 4718680
last-checkpoint/3_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70807611011deb9d648984e4201362594f4128f2399b18fb763a243b933061ba
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ec50e543099a6bb0c1f8e5fdd57d0d9e86ebe7e6b5160cc004a39d435e0eea0
3
  size 4718680
last-checkpoint/README.md CHANGED
@@ -472,7 +472,7 @@ print(query_embeddings.shape, document_embeddings.shape)
472
  # Get the similarity scores for the embeddings
473
  similarities = model.similarity(query_embeddings, document_embeddings)
474
  print(similarities)
475
- # tensor([[ 0.6607, -0.0923, -0.0703]])
476
  ```
477
 
478
  <!--
@@ -701,6 +701,10 @@ You can finetune this model on your own dataset.
701
  | 0.4573 | 900 | 0.111 |
702
  | 0.4827 | 950 | 0.1163 |
703
  | 0.5081 | 1000 | 0.1133 |
 
 
 
 
704
 
705
 
706
  ### Framework Versions
 
472
  # Get the similarity scores for the embeddings
473
  similarities = model.similarity(query_embeddings, document_embeddings)
474
  print(similarities)
475
+ # tensor([[ 0.7396, -0.0637, -0.0765]])
476
  ```
477
 
478
  <!--
 
701
  | 0.4573 | 900 | 0.111 |
702
  | 0.4827 | 950 | 0.1163 |
703
  | 0.5081 | 1000 | 0.1133 |
704
+ | 0.5335 | 1050 | 0.1008 |
705
+ | 0.5589 | 1100 | 0.1075 |
706
+ | 0.5843 | 1150 | 0.0994 |
707
+ | 0.6098 | 1200 | 0.0911 |
708
 
709
 
710
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d73d930444c3a62a922f022e9b1dd8c90fa0101e0f9d6a5b5e7b445f20cc9f4c
3
  size 605759848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f10ebdd6d376d88b30ef3bdc290fee724cdcdb9834c31657cb9b7e697616ef0b
3
  size 605759848
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1c2b36aa1ed8b386c5ed3b537cdf298144b552b7011463c205e695056f73f6e
3
  size 1230592267
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92bc90f9a7af2adcce32e0343802524c333d41bf01c18a9ae80cb07c5024b317
3
  size 1230592267
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab6c56263d0a3d675d4f747bb77db752789302abc7e0c5864efa40f605c0194a
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8e232785d1786cb94e8889d9a79973e568b9bfb82c9ff8f8a12783934ff997c
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.508130081300813,
6
  "eval_steps": 500,
7
- "global_step": 1000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -148,6 +148,34 @@
148
  "learning_rate": 2.7357425183512143e-05,
149
  "loss": 0.1133,
150
  "step": 1000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
151
  }
152
  ],
153
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.6097560975609756,
6
  "eval_steps": 500,
7
+ "global_step": 1200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
148
  "learning_rate": 2.7357425183512143e-05,
149
  "loss": 0.1133,
150
  "step": 1000
151
+ },
152
+ {
153
+ "epoch": 0.5335365853658537,
154
+ "grad_norm": 3.34375,
155
+ "learning_rate": 2.5945793337097685e-05,
156
+ "loss": 0.1008,
157
+ "step": 1050
158
+ },
159
+ {
160
+ "epoch": 0.5589430894308943,
161
+ "grad_norm": 3.890625,
162
+ "learning_rate": 2.453416149068323e-05,
163
+ "loss": 0.1075,
164
+ "step": 1100
165
+ },
166
+ {
167
+ "epoch": 0.584349593495935,
168
+ "grad_norm": 3.6875,
169
+ "learning_rate": 2.3122529644268774e-05,
170
+ "loss": 0.0994,
171
+ "step": 1150
172
+ },
173
+ {
174
+ "epoch": 0.6097560975609756,
175
+ "grad_norm": 2.609375,
176
+ "learning_rate": 2.171089779785432e-05,
177
+ "loss": 0.0911,
178
+ "step": 1200
179
  }
180
  ],
181
  "logging_steps": 50,