rabaevn committed on
Commit
8922bda
·
verified ·
1 Parent(s): df145c6

Training in progress, step 1600, checkpoint

Browse files
last-checkpoint/2_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14549a8f2b505a8545ac674725066f9c305d15592336942bb065ad4f6ddeb306
3
  size 9437272
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ef8c04b17ad19cb132ef20b5b1a1912424354dd87c3760dbafc1f82f4998feb
3
  size 9437272
last-checkpoint/3_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0952aa81b7cdd3daf666c37d0854e5bff5e7a14e28b4874444f7772caeb46f9d
3
  size 9437272
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b41b495d7e858c250a6b90039f9524914ea51d03a32937b352f996067227212d
3
  size 9437272
last-checkpoint/README.md CHANGED
@@ -450,7 +450,7 @@ print(query_embeddings.shape, document_embeddings.shape)
450
  # Get the similarity scores for the embeddings
451
  similarities = model.similarity(query_embeddings, document_embeddings)
452
  print(similarities)
453
- # tensor([[ 0.6231, -0.0744, 0.1279]])
454
  ```
455
 
456
  <!--
@@ -715,6 +715,10 @@ You can finetune this model on your own dataset.
715
  | 0.4302 | 1300 | 0.09 |
716
  | 0.4467 | 1350 | 0.0866 |
717
  | 0.4633 | 1400 | 0.0826 |
 
 
 
 
718
 
719
 
720
  ### Framework Versions
 
450
  # Get the similarity scores for the embeddings
451
  similarities = model.similarity(query_embeddings, document_embeddings)
452
  print(similarities)
453
+ # tensor([[ 0.5546, -0.0938, 0.1724]])
454
  ```
455
 
456
  <!--
 
715
  | 0.4302 | 1300 | 0.09 |
716
  | 0.4467 | 1350 | 0.0866 |
717
  | 0.4633 | 1400 | 0.0826 |
718
+ | 0.4798 | 1450 | 0.0735 |
719
+ | 0.4964 | 1500 | 0.0801 |
720
+ | 0.5129 | 1550 | 0.0694 |
721
+ | 0.5295 | 1600 | 0.0681 |
722
 
723
 
724
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:477457ae6906b9786bffa8dd6309187edd28e664410a059cfffacf1f2cae3bc6
3
  size 1211486072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01b4fd7c2f9f44ed46fd6caca70cf6aebe1f901b80125453289a207674ea6322
3
  size 1211486072
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6fcb82c0030f2e69a729cae162131808daef058010082ee7c6a1cdc5a1109b47
3
  size 2460923467
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d22bc43d0ea91abbc9c61e88421b8d7b9f75756021d1e9a3876bbcd9caea969
3
  size 2460923467
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3fcfe456f41c489958b10f637ef851405e803e7363ed9925c3152e6d7cebd14a
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0de07336841d438b92ac2af437c756d5b1eee4a3bd0fc209eb2ee92c1bfa99d5
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1807d5c010828dc5af6863500632317772ab24748d2f2f3dc9b74b307531f182
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5730fd993b5a94a8fdb013ee342013b2eea3ce6c8a5a4ded39a304962934fc3
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.4632693580410324,
6
  "eval_steps": 500,
7
- "global_step": 1400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -204,6 +204,34 @@
204
  "learning_rate": 1.1938212578153734e-05,
205
  "loss": 0.0826,
206
  "step": 1400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
207
  }
208
  ],
209
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.5294506949040371,
6
  "eval_steps": 500,
7
+ "global_step": 1600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
204
  "learning_rate": 1.1938212578153734e-05,
205
  "loss": 0.0826,
206
  "step": 1400
207
+ },
208
+ {
209
+ "epoch": 0.4798146922567836,
210
+ "grad_norm": 4.941124439239502,
211
+ "learning_rate": 1.1570430305259287e-05,
212
+ "loss": 0.0735,
213
+ "step": 1450
214
+ },
215
+ {
216
+ "epoch": 0.49636002647253474,
217
+ "grad_norm": 4.166671276092529,
218
+ "learning_rate": 1.120264803236484e-05,
219
+ "loss": 0.0801,
220
+ "step": 1500
221
+ },
222
+ {
223
+ "epoch": 0.5129053606882858,
224
+ "grad_norm": 4.212963581085205,
225
+ "learning_rate": 1.0834865759470394e-05,
226
+ "loss": 0.0694,
227
+ "step": 1550
228
+ },
229
+ {
230
+ "epoch": 0.5294506949040371,
231
+ "grad_norm": 4.659167766571045,
232
+ "learning_rate": 1.0467083486575949e-05,
233
+ "loss": 0.0681,
234
+ "step": 1600
235
  }
236
  ],
237
  "logging_steps": 50,