guyhadad01 committed on
Commit
b2c8b7c
·
verified ·
1 Parent(s): d9719e9

Training in progress, step 400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -466,9 +466,9 @@ print(embeddings.shape)
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
- # tensor([[ 1.0000, 0.4864, -0.0477],
470
- # [ 0.4864, 1.0000, -0.0628],
471
- # [-0.0477, -0.0628, 1.0000]])
472
  ```
473
 
474
  <!--
@@ -680,6 +680,10 @@ You can finetune this model on your own dataset.
680
  | 0.0508 | 100 | 0.9886 |
681
  | 0.0762 | 150 | 0.7345 |
682
  | 0.1016 | 200 | 0.6664 |
 
 
 
 
683
 
684
 
685
  ### Framework Versions
 
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
+ # tensor([[ 1.0000, 0.5340, -0.0489],
470
+ # [ 0.5340, 1.0000, -0.0623],
471
+ # [-0.0489, -0.0623, 1.0000]])
472
  ```
473
 
474
  <!--
 
680
  | 0.0508 | 100 | 0.9886 |
681
  | 0.0762 | 150 | 0.7345 |
682
  | 0.1016 | 200 | 0.6664 |
683
+ | 0.1270 | 250 | 0.6045 |
684
+ | 0.1524 | 300 | 0.5898 |
685
+ | 0.1778 | 350 | 0.5569 |
686
+ | 0.2033 | 400 | 0.5396 |
687
 
688
 
689
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f9cd66af2df3d93b44a7be9da35e1c72b158bddbc6dca683583cea252dd21ad
3
  size 45437864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebaadd7ca69549d21e0a9b5a198c58e5df0a12a58aa56635196f10c545d2363b
3
  size 45437864
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce2ceafe399e0f67b7e02eadf72ed444135de3040ff7b41718e7e5c2b1b4379b
3
  size 90346763
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8a26a7a0f56cd6950e1e3ae0ec3c0412ad0bcebd9c3dfa88f2162b4a3e97528
3
  size 90346763
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:193ad77f0728afe0c1206dffe24ec29d395eeee0f88a01a3b5ee926dada4548f
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4865ec8a72ed85ad9518ab1ebb67049ddc164edcb9400bda4e9e54f2cabcece1
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d4e739551319e957e6c472fd8c9bacf3bae41231a764211a8f19abc4bae6961
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fc56140e5c37825482a26f377f07f74eaa4028a1b2f8b46eaa880f0215c9abf
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.1016260162601626,
6
  "eval_steps": 500,
7
- "global_step": 200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -36,6 +36,34 @@
36
  "learning_rate": 4.994353472614343e-05,
37
  "loss": 0.6664,
38
  "step": 200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  }
40
  ],
41
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.2032520325203252,
6
  "eval_steps": 500,
7
+ "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
36
  "learning_rate": 4.994353472614343e-05,
37
  "loss": 0.6664,
38
  "step": 200
39
+ },
40
+ {
41
+ "epoch": 0.12703252032520326,
42
+ "grad_norm": 2.078125,
43
+ "learning_rate": 4.853190287972897e-05,
44
+ "loss": 0.6045,
45
+ "step": 250
46
+ },
47
+ {
48
+ "epoch": 0.1524390243902439,
49
+ "grad_norm": 2.046875,
50
+ "learning_rate": 4.7120271033314515e-05,
51
+ "loss": 0.5898,
52
+ "step": 300
53
+ },
54
+ {
55
+ "epoch": 0.17784552845528456,
56
+ "grad_norm": 1.6875,
57
+ "learning_rate": 4.570863918690006e-05,
58
+ "loss": 0.5569,
59
+ "step": 350
60
+ },
61
+ {
62
+ "epoch": 0.2032520325203252,
63
+ "grad_norm": 1.9765625,
64
+ "learning_rate": 4.42970073404856e-05,
65
+ "loss": 0.5396,
66
+ "step": 400
67
  }
68
  ],
69
  "logging_steps": 50,