guyhadad01 committed on
Commit
d798964
·
verified ·
1 Parent(s): c074dfe

Training in progress, step 600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -505,9 +505,9 @@ print(embeddings.shape)
505
  # Get the similarity scores for the embeddings
506
  similarities = model.similarity(embeddings, embeddings)
507
  print(similarities)
508
- # tensor([[ 1.0000, 0.6415, -0.0405],
509
- # [ 0.6415, 1.0000, -0.0528],
510
- # [-0.0405, -0.0528, 1.0000]])
511
  ```
512
 
513
  <!--
@@ -723,6 +723,10 @@ You can finetune this model on your own dataset.
723
  | 0.2879 | 300 | 0.4757 |
724
  | 0.3359 | 350 | 0.477 |
725
  | 0.3839 | 400 | 0.4604 |
 
 
 
 
726
 
727
 
728
  ### Framework Versions
 
505
  # Get the similarity scores for the embeddings
506
  similarities = model.similarity(embeddings, embeddings)
507
  print(similarities)
508
+ # tensor([[ 1.0000, 0.6584, -0.0531],
509
+ # [ 0.6584, 1.0000, -0.0991],
510
+ # [-0.0531, -0.0991, 1.0000]])
511
  ```
512
 
513
  <!--
 
723
  | 0.2879 | 300 | 0.4757 |
724
  | 0.3359 | 350 | 0.477 |
725
  | 0.3839 | 400 | 0.4604 |
726
+ | 0.4319 | 450 | 0.4363 |
727
+ | 0.4798 | 500 | 0.4291 |
728
+ | 0.5278 | 550 | 0.4192 |
729
+ | 0.5758 | 600 | 0.4287 |
730
 
731
 
732
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1e4673a236c95d0bc4a0ae5ca5eae4eee997d5826d21e669e6418ac6a733790
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:020d0d7176e467b6cd601d44d45bfdcd0927689574be8e5af96eafb7f39d4781
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d118b435f05009ed43f3d552c5b45865b77291129c0c33b6f607fed13185aa8b
3
  size 180608203
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f69755d55036a1c9c5e74b7da11093ccc408dc752b3193aa2c2a2920b5241214
3
  size 180608203
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44fe371788fff42378dd68792f5fdb6293656d333891448d1b8f5196e3c8fec7
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:930d5cc5a42dcd98e15dda5f0b8f8625912aaf157ec6f27c32761a0f3c4e311e
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df0af633a4f9f804af5866a99325014522ad3b38b189715886b1cb20a1e95ac1
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edab5dd7827df6c860a06cbc8d688873b247f37062ba5008ca6bb63249a0eb13
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.3838771593090211,
6
  "eval_steps": 500,
7
- "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -64,6 +64,34 @@
64
  "learning_rate": 3.431163287086446e-05,
65
  "loss": 0.4604,
66
  "step": 400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
67
  }
68
  ],
69
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.5758157389635317,
6
  "eval_steps": 500,
7
+ "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
64
  "learning_rate": 3.431163287086446e-05,
65
  "loss": 0.4604,
66
  "step": 400
67
+ },
68
+ {
69
+ "epoch": 0.43186180422264875,
70
+ "grad_norm": 1.7176055908203125,
71
+ "learning_rate": 3.16435432230523e-05,
72
+ "loss": 0.4363,
73
+ "step": 450
74
+ },
75
+ {
76
+ "epoch": 0.4798464491362764,
77
+ "grad_norm": 1.6267833709716797,
78
+ "learning_rate": 2.897545357524013e-05,
79
+ "loss": 0.4291,
80
+ "step": 500
81
+ },
82
+ {
83
+ "epoch": 0.527831094049904,
84
+ "grad_norm": 1.6887868642807007,
85
+ "learning_rate": 2.6307363927427965e-05,
86
+ "loss": 0.4192,
87
+ "step": 550
88
+ },
89
+ {
90
+ "epoch": 0.5758157389635317,
91
+ "grad_norm": 1.4798693656921387,
92
+ "learning_rate": 2.3639274279615796e-05,
93
+ "loss": 0.4287,
94
+ "step": 600
95
  }
96
  ],
97
  "logging_steps": 50,