guyhadad01 committed on
Commit
0ec3999
·
verified ·
1 Parent(s): a558da5

Training in progress, step 400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -505,9 +505,9 @@ print(embeddings.shape)
505
  # Get the similarity scores for the embeddings
506
  similarities = model.similarity(embeddings, embeddings)
507
  print(similarities)
508
- # tensor([[ 1.0000, 0.6097, -0.0412],
509
- # [ 0.6097, 1.0000, -0.0067],
510
- # [-0.0412, -0.0067, 1.0000]])
511
  ```
512
 
513
  <!--
@@ -719,6 +719,10 @@ You can finetune this model on your own dataset.
719
  | 0.0960 | 100 | 0.6884 |
720
  | 0.1440 | 150 | 0.5902 |
721
  | 0.1919 | 200 | 0.5362 |
 
 
 
 
722
 
723
 
724
  ### Framework Versions
 
505
  # Get the similarity scores for the embeddings
506
  similarities = model.similarity(embeddings, embeddings)
507
  print(similarities)
508
+ # tensor([[ 1.0000, 0.6415, -0.0405],
509
+ # [ 0.6415, 1.0000, -0.0528],
510
+ # [-0.0405, -0.0528, 1.0000]])
511
  ```
512
 
513
  <!--
 
719
  | 0.0960 | 100 | 0.6884 |
720
  | 0.1440 | 150 | 0.5902 |
721
  | 0.1919 | 200 | 0.5362 |
722
+ | 0.2399 | 250 | 0.5196 |
723
+ | 0.2879 | 300 | 0.4757 |
724
+ | 0.3359 | 350 | 0.477 |
725
+ | 0.3839 | 400 | 0.4604 |
726
 
727
 
728
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45678ca92701e2b21d762de3576e475d0d9a1bd02f16d5e2320057ec6fa09465
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1e4673a236c95d0bc4a0ae5ca5eae4eee997d5826d21e669e6418ac6a733790
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28e4b9ec6534cb3bfecf2195dc89b9aecba29d7b8f791ee24ecb9b2f2b2f1cf8
3
  size 180608203
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d118b435f05009ed43f3d552c5b45865b77291129c0c33b6f607fed13185aa8b
3
  size 180608203
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9bef9076975c77b5c8cc319158c1ecd2196bb244317040f0ca1f1eedc950136
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44fe371788fff42378dd68792f5fdb6293656d333891448d1b8f5196e3c8fec7
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d88407aff68ef8509234fd2211bb50888896b55849641ad9180c09511a40fab
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df0af633a4f9f804af5866a99325014522ad3b38b189715886b1cb20a1e95ac1
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.19193857965451055,
6
  "eval_steps": 500,
7
- "global_step": 200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -36,6 +36,34 @@
36
  "learning_rate": 4.4983991462113126e-05,
37
  "loss": 0.5362,
38
  "step": 200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  }
40
  ],
41
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.3838771593090211,
6
  "eval_steps": 500,
7
+ "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
36
  "learning_rate": 4.4983991462113126e-05,
37
  "loss": 0.5362,
38
  "step": 200
39
+ },
40
+ {
41
+ "epoch": 0.2399232245681382,
42
+ "grad_norm": 1.8430039882659912,
43
+ "learning_rate": 4.231590181430096e-05,
44
+ "loss": 0.5196,
45
+ "step": 250
46
+ },
47
+ {
48
+ "epoch": 0.28790786948176583,
49
+ "grad_norm": 1.9631397724151611,
50
+ "learning_rate": 3.9647812166488794e-05,
51
+ "loss": 0.4757,
52
+ "step": 300
53
+ },
54
+ {
55
+ "epoch": 0.33589251439539347,
56
+ "grad_norm": 1.9073326587677002,
57
+ "learning_rate": 3.697972251867663e-05,
58
+ "loss": 0.477,
59
+ "step": 350
60
+ },
61
+ {
62
+ "epoch": 0.3838771593090211,
63
+ "grad_norm": 1.7632094621658325,
64
+ "learning_rate": 3.431163287086446e-05,
65
+ "loss": 0.4604,
66
+ "step": 400
67
  }
68
  ],
69
  "logging_steps": 50,