guyhadad01 committed on
Commit
416fb4f
·
verified ·
1 Parent(s): 3b87fc7

Training in progress, step 1968, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -466,9 +466,9 @@ print(embeddings.shape)
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
- # tensor([[ 1.0000, 0.5466, -0.0454],
470
- # [ 0.5466, 1.0000, -0.0568],
471
- # [-0.0454, -0.0568, 1.0000]])
472
  ```
473
 
474
  <!--
@@ -712,6 +712,9 @@ You can finetune this model on your own dataset.
712
  | 0.8638 | 1700 | 0.4797 |
713
  | 0.8892 | 1750 | 0.4836 |
714
  | 0.9146 | 1800 | 0.4832 |
 
 
 
715
 
716
 
717
  ### Framework Versions
 
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
+ # tensor([[ 1.0000, 0.5476, -0.0452],
470
+ # [ 0.5476, 1.0000, -0.0572],
471
+ # [-0.0452, -0.0572, 1.0000]])
472
  ```
473
 
474
  <!--
 
712
  | 0.8638 | 1700 | 0.4797 |
713
  | 0.8892 | 1750 | 0.4836 |
714
  | 0.9146 | 1800 | 0.4832 |
715
+ | 0.9400 | 1850 | 0.4945 |
716
+ | 0.9654 | 1900 | 0.4686 |
717
+ | 0.9909 | 1950 | 0.4889 |
718
 
719
 
720
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17554aba416dac32662ee4493f2bcaa68570b7683a6b8940eb5d0031827f3358
3
  size 45437864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9080ef7277f0217e3fcbbed443d4e5ddc988fbc3584f2d4e802ff68df0a7bdac
3
  size 45437864
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c7df775c39fa3b71bbba8fbfd34191533c8b284b769351bdb0714a10d07e26c
3
  size 90346763
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27d3829e1ab12246a2cf294916488e1316baa979819e854e9daf959d2b57cba6
3
  size 90346763
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4383e099fde8143073bc583376ee59e15bec296ef152a2f16e0f5296290e06e4
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbb5e9a64c60aa1634b1d1197ab20d54415e7d3be09731170c25ff71a460e2a5
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec29327b2c793ef05a01c6bae10cd1cf49d3fd34bb421765aad2d8f09bc372c0
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04e88cb3830f9a985bd7f6d2cca6f569425345d84761a9b2c6e58dd048cd58e3
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.9146341463414634,
6
  "eval_steps": 500,
7
- "global_step": 1800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -260,6 +260,27 @@
260
  "learning_rate": 4.771315640880859e-06,
261
  "loss": 0.4832,
262
  "step": 1800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
263
  }
264
  ],
265
  "logging_steps": 50,
@@ -274,7 +295,7 @@
274
  "should_evaluate": false,
275
  "should_log": false,
276
  "should_save": true,
277
- "should_training_stop": false
278
  },
279
  "attributes": {}
280
  }
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 1.0,
6
  "eval_steps": 500,
7
+ "global_step": 1968,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
260
  "learning_rate": 4.771315640880859e-06,
261
  "loss": 0.4832,
262
  "step": 1800
263
+ },
264
+ {
265
+ "epoch": 0.9400406504065041,
266
+ "grad_norm": 1.859375,
267
+ "learning_rate": 3.3596837944664035e-06,
268
+ "loss": 0.4945,
269
+ "step": 1850
270
+ },
271
+ {
272
+ "epoch": 0.9654471544715447,
273
+ "grad_norm": 1.6640625,
274
+ "learning_rate": 1.948051948051948e-06,
275
+ "loss": 0.4686,
276
+ "step": 1900
277
+ },
278
+ {
279
+ "epoch": 0.9908536585365854,
280
+ "grad_norm": 1.796875,
281
+ "learning_rate": 5.364201016374929e-07,
282
+ "loss": 0.4889,
283
+ "step": 1950
284
  }
285
  ],
286
  "logging_steps": 50,
 
295
  "should_evaluate": false,
296
  "should_log": false,
297
  "should_save": true,
298
+ "should_training_stop": true
299
  },
300
  "attributes": {}
301
  }