guyhadad01 committed on
Commit
420fabf
·
verified ·
1 Parent(s): 1e52d52

Training in progress, step 1200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -466,9 +466,9 @@ print(embeddings.shape)
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
- # tensor([[ 1.0000, 0.5433, -0.0509],
470
- # [ 0.5433, 1.0000, -0.0602],
471
- # [-0.0509, -0.0602, 1.0000]])
472
  ```
473
 
474
  <!--
@@ -696,6 +696,10 @@ You can finetune this model on your own dataset.
696
  | 0.4573 | 900 | 0.4869 |
697
  | 0.4827 | 950 | 0.4898 |
698
  | 0.5081 | 1000 | 0.501 |
 
 
 
 
699
 
700
 
701
  ### Framework Versions
 
466
  # Get the similarity scores for the embeddings
467
  similarities = model.similarity(embeddings, embeddings)
468
  print(similarities)
469
+ # tensor([[ 1.0000, 0.5452, -0.0490],
470
+ # [ 0.5452, 1.0000, -0.0581],
471
+ # [-0.0490, -0.0581, 1.0000]])
472
  ```
473
 
474
  <!--
 
696
  | 0.4573 | 900 | 0.4869 |
697
  | 0.4827 | 950 | 0.4898 |
698
  | 0.5081 | 1000 | 0.501 |
699
+ | 0.5335 | 1050 | 0.4843 |
700
+ | 0.5589 | 1100 | 0.496 |
701
+ | 0.5843 | 1150 | 0.4878 |
702
+ | 0.6098 | 1200 | 0.4892 |
703
 
704
 
705
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2e1e9d5eff6c41809cc50c6c706e397f17bdefc78c905246322008dcb6296db
3
  size 45437864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6ccad225ace68dee6e0781e8e27901d71d7fa01d17d06a0b6e3fc454a5478e4
3
  size 45437864
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5dcbdfcd46b4c04eb85077625bdbae7131e652ba94a811efcd17b9990ba6743b
3
  size 90346763
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9aa4f63fab73d0181a0c9306b4976314c3fecfc2cc8c586e50cb9e5ef066cf9d
3
  size 90346763
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dffc0ceb65e8c69d366f764cae9f9d5143c5e98038853351451b525757197063
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:194afcbe1a7663b9e29766856c518f1adcc144fc5b40f9d65d44fac282c10ac3
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab6c56263d0a3d675d4f747bb77db752789302abc7e0c5864efa40f605c0194a
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8e232785d1786cb94e8889d9a79973e568b9bfb82c9ff8f8a12783934ff997c
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.508130081300813,
6
  "eval_steps": 500,
7
- "global_step": 1000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -148,6 +148,34 @@
148
  "learning_rate": 2.7357425183512143e-05,
149
  "loss": 0.501,
150
  "step": 1000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
151
  }
152
  ],
153
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.6097560975609756,
6
  "eval_steps": 500,
7
+ "global_step": 1200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
148
  "learning_rate": 2.7357425183512143e-05,
149
  "loss": 0.501,
150
  "step": 1000
151
+ },
152
+ {
153
+ "epoch": 0.5335365853658537,
154
+ "grad_norm": 1.7578125,
155
+ "learning_rate": 2.5945793337097685e-05,
156
+ "loss": 0.4843,
157
+ "step": 1050
158
+ },
159
+ {
160
+ "epoch": 0.5589430894308943,
161
+ "grad_norm": 1.9453125,
162
+ "learning_rate": 2.453416149068323e-05,
163
+ "loss": 0.496,
164
+ "step": 1100
165
+ },
166
+ {
167
+ "epoch": 0.584349593495935,
168
+ "grad_norm": 2.046875,
169
+ "learning_rate": 2.3122529644268774e-05,
170
+ "loss": 0.4878,
171
+ "step": 1150
172
+ },
173
+ {
174
+ "epoch": 0.6097560975609756,
175
+ "grad_norm": 1.875,
176
+ "learning_rate": 2.171089779785432e-05,
177
+ "loss": 0.4892,
178
+ "step": 1200
179
  }
180
  ],
181
  "logging_steps": 50,