guyhadad01 committed on
Commit
a91119d
·
verified ·
1 Parent(s): e835d84

Training in progress, step 600, checkpoint

Browse files
last-checkpoint/2_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8385504144ad50228e1459ea5b1da17bd7f4d3aac19f5476c1c8296b68f4f05b
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27c35bbbe0b3b4648d206a86b9a22ed14cdd5ba12f681b9329d51cc3594ed874
3
  size 4718680
last-checkpoint/3_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac472c212bf6ebd5d336507924eb651104467de24dfbfaa520db97b7708d09b9
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4cec3b48c616eb4b62540bb0ef79466b8968a49111b3b79390a007de3e0f383
3
  size 4718680
last-checkpoint/README.md CHANGED
@@ -472,7 +472,7 @@ print(query_embeddings.shape, document_embeddings.shape)
472
  # Get the similarity scores for the embeddings
473
  similarities = model.similarity(query_embeddings, document_embeddings)
474
  print(similarities)
475
- # tensor([[ 0.5851, -0.1180, -0.1336]])
476
  ```
477
 
478
  <!--
@@ -689,6 +689,10 @@ You can finetune this model on your own dataset.
689
  | 0.1524 | 300 | 0.2123 |
690
  | 0.1778 | 350 | 0.186 |
691
  | 0.2033 | 400 | 0.1693 |
 
 
 
 
692
 
693
 
694
  ### Framework Versions
 
472
  # Get the similarity scores for the embeddings
473
  similarities = model.similarity(query_embeddings, document_embeddings)
474
  print(similarities)
475
+ # tensor([[ 0.6778, -0.0608, -0.0575]])
476
  ```
477
 
478
  <!--
 
689
  | 0.1524 | 300 | 0.2123 |
690
  | 0.1778 | 350 | 0.186 |
691
  | 0.2033 | 400 | 0.1693 |
692
+ | 0.2287 | 450 | 0.1645 |
693
+ | 0.2541 | 500 | 0.1625 |
694
+ | 0.2795 | 550 | 0.1496 |
695
+ | 0.3049 | 600 | 0.1443 |
696
 
697
 
698
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5538ec5f6c8499fe8ef0de1e93c420e403b0b4f926f25aa62e05b6f0e23991b0
3
  size 605759848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc1843a41fe2dd32d660c15e8784bd2856c6414131db4c135fd8dff36f2c1ad8
3
  size 605759848
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd9addc9d33db5aa5f32bbfd79d0f8ab2168d1aa307bb30b7aa8355f331a85fd
3
  size 1230592267
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dc4a0287e603c73e34c64d56fe7746287894b2e986c2ef471e4e5419ebf89b5
3
  size 1230592267
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8fc56140e5c37825482a26f377f07f74eaa4028a1b2f8b46eaa880f0215c9abf
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7eb57b4b6586ca069ba10818f8421f503ffe2fcc4027df0b3bf8a2421cac2a7
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.2032520325203252,
6
  "eval_steps": 500,
7
- "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -64,6 +64,34 @@
64
  "learning_rate": 4.42970073404856e-05,
65
  "loss": 0.1693,
66
  "step": 400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
67
  }
68
  ],
69
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.3048780487804878,
6
  "eval_steps": 500,
7
+ "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
64
  "learning_rate": 4.42970073404856e-05,
65
  "loss": 0.1693,
66
  "step": 400
67
+ },
68
+ {
69
+ "epoch": 0.22865853658536586,
70
+ "grad_norm": 5.75,
71
+ "learning_rate": 4.288537549407115e-05,
72
+ "loss": 0.1645,
73
+ "step": 450
74
+ },
75
+ {
76
+ "epoch": 0.2540650406504065,
77
+ "grad_norm": 4.21875,
78
+ "learning_rate": 4.147374364765669e-05,
79
+ "loss": 0.1625,
80
+ "step": 500
81
+ },
82
+ {
83
+ "epoch": 0.27947154471544716,
84
+ "grad_norm": 3.984375,
85
+ "learning_rate": 4.006211180124224e-05,
86
+ "loss": 0.1496,
87
+ "step": 550
88
+ },
89
+ {
90
+ "epoch": 0.3048780487804878,
91
+ "grad_norm": 3.625,
92
+ "learning_rate": 3.8650479954827784e-05,
93
+ "loss": 0.1443,
94
+ "step": 600
95
  }
96
  ],
97
  "logging_steps": 50,