rabaevn commited on
Commit
d699bff
·
verified ·
1 Parent(s): c5cb20b

Training in progress, step 1400, checkpoint

Browse files
last-checkpoint/2_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13c09a5e85744071f43b660f276c30dd0c78a002e829d09339df6553d68e5e9c
3
  size 9437272
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14549a8f2b505a8545ac674725066f9c305d15592336942bb065ad4f6ddeb306
3
  size 9437272
last-checkpoint/3_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9bce4267c7916e7b1d39e730977890918f472a20904f7cdb5c6470b3bb959efc
3
  size 9437272
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0952aa81b7cdd3daf666c37d0854e5bff5e7a14e28b4874444f7772caeb46f9d
3
  size 9437272
last-checkpoint/README.md CHANGED
@@ -450,7 +450,7 @@ print(query_embeddings.shape, document_embeddings.shape)
450
  # Get the similarity scores for the embeddings
451
  similarities = model.similarity(query_embeddings, document_embeddings)
452
  print(similarities)
453
- # tensor([[ 0.6289, -0.0545, 0.2478]])
454
  ```
455
 
456
  <!--
@@ -711,6 +711,10 @@ You can finetune this model on your own dataset.
711
  | 0.3640 | 1100 | 0.091 |
712
  | 0.3805 | 1150 | 0.0802 |
713
  | 0.3971 | 1200 | 0.0824 |
 
 
 
 
714
 
715
 
716
  ### Framework Versions
 
450
  # Get the similarity scores for the embeddings
451
  similarities = model.similarity(query_embeddings, document_embeddings)
452
  print(similarities)
453
+ # tensor([[ 0.6231, -0.0744, 0.1279]])
454
  ```
455
 
456
  <!--
 
711
  | 0.3640 | 1100 | 0.091 |
712
  | 0.3805 | 1150 | 0.0802 |
713
  | 0.3971 | 1200 | 0.0824 |
714
+ | 0.4136 | 1250 | 0.0845 |
715
+ | 0.4302 | 1300 | 0.09 |
716
+ | 0.4467 | 1350 | 0.0866 |
717
+ | 0.4633 | 1400 | 0.0826 |
718
 
719
 
720
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba9d8f01d2057279be1dd562ae68b04fc16b9056d28e910d54d2259bf7168206
3
  size 1211486072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:477457ae6906b9786bffa8dd6309187edd28e664410a059cfffacf1f2cae3bc6
3
  size 1211486072
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:763bdcee7c6c388f0295a0946aba7ea97cd1965328c61b7d56cab32345452a48
3
  size 2460923467
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fcb82c0030f2e69a729cae162131808daef058010082ee7c6a1cdc5a1109b47
3
  size 2460923467
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c53cf553f6434449959e590b32ad22ac0c6e07ffae962a4164d31ea3a75d345e
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fcfe456f41c489958b10f637ef851405e803e7363ed9925c3152e6d7cebd14a
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:781bdd0549418e8b91230f3cd2918472966507e472c42f0916b387b617b2e59a
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1807d5c010828dc5af6863500632317772ab24748d2f2f3dc9b74b307531f182
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.3970880211780278,
6
  "eval_steps": 500,
7
- "global_step": 1200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -176,6 +176,34 @@
176
  "learning_rate": 1.3409341669731519e-05,
177
  "loss": 0.0824,
178
  "step": 1200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
179
  }
180
  ],
181
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.4632693580410324,
6
  "eval_steps": 500,
7
+ "global_step": 1400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
176
  "learning_rate": 1.3409341669731519e-05,
177
  "loss": 0.0824,
178
  "step": 1200
179
+ },
180
+ {
181
+ "epoch": 0.41363335539377893,
182
+ "grad_norm": 2.9681406021118164,
183
+ "learning_rate": 1.3041559396837074e-05,
184
+ "loss": 0.0845,
185
+ "step": 1250
186
+ },
187
+ {
188
+ "epoch": 0.4301786896095301,
189
+ "grad_norm": 6.426875591278076,
190
+ "learning_rate": 1.2673777123942627e-05,
191
+ "loss": 0.09,
192
+ "step": 1300
193
+ },
194
+ {
195
+ "epoch": 0.44672402382528126,
196
+ "grad_norm": 8.284296035766602,
197
+ "learning_rate": 1.2305994851048179e-05,
198
+ "loss": 0.0866,
199
+ "step": 1350
200
+ },
201
+ {
202
+ "epoch": 0.4632693580410324,
203
+ "grad_norm": 5.250367164611816,
204
+ "learning_rate": 1.1938212578153734e-05,
205
+ "loss": 0.0826,
206
+ "step": 1400
207
  }
208
  ],
209
  "logging_steps": 50,