guyhadad01 committed on
Commit
0dcd9fc
·
verified ·
1 Parent(s): 64d999c

Training in progress, step 800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -505,9 +505,9 @@ print(embeddings.shape)
505
  # Get the similarity scores for the embeddings
506
  similarities = model.similarity(embeddings, embeddings)
507
  print(similarities)
508
- # tensor([[ 1.0000, 0.6584, -0.0531],
509
- # [ 0.6584, 1.0000, -0.0991],
510
- # [-0.0531, -0.0991, 1.0000]])
511
  ```
512
 
513
  <!--
@@ -727,6 +727,10 @@ You can finetune this model on your own dataset.
727
  | 0.4798 | 500 | 0.4291 |
728
  | 0.5278 | 550 | 0.4192 |
729
  | 0.5758 | 600 | 0.4287 |
 
 
 
 
730
 
731
 
732
  ### Framework Versions
 
505
  # Get the similarity scores for the embeddings
506
  similarities = model.similarity(embeddings, embeddings)
507
  print(similarities)
508
+ # tensor([[ 1.0000, 0.6636, -0.0516],
509
+ # [ 0.6636, 1.0000, -0.0845],
510
+ # [-0.0516, -0.0845, 1.0000]])
511
  ```
512
 
513
  <!--
 
727
  | 0.4798 | 500 | 0.4291 |
728
  | 0.5278 | 550 | 0.4192 |
729
  | 0.5758 | 600 | 0.4287 |
730
+ | 0.6238 | 650 | 0.4093 |
731
+ | 0.6718 | 700 | 0.4118 |
732
+ | 0.7198 | 750 | 0.3923 |
733
+ | 0.7678 | 800 | 0.4183 |
734
 
735
 
736
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:020d0d7176e467b6cd601d44d45bfdcd0927689574be8e5af96eafb7f39d4781
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff756dbb38a75171525943ee07a6245096eef361b8236a195a79e2f4c43e6b40
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f69755d55036a1c9c5e74b7da11093ccc408dc752b3193aa2c2a2920b5241214
3
  size 180608203
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:519486a3681858d50acde069f580d97e5840fa5ac9d65b3f042141bd25e1cb41
3
  size 180608203
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:930d5cc5a42dcd98e15dda5f0b8f8625912aaf157ec6f27c32761a0f3c4e311e
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f16fa28ebb8e3a1b82ca55c6cf1c0dd60b11d4021c7a97520baf445d2c84fd8
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edab5dd7827df6c860a06cbc8d688873b247f37062ba5008ca6bb63249a0eb13
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d57a1899b276deaf9bc6c347b576a36bf470824199b1d1731a5698c732cc5649
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.5758157389635317,
6
  "eval_steps": 500,
7
- "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -92,6 +92,34 @@
92
  "learning_rate": 2.3639274279615796e-05,
93
  "loss": 0.4287,
94
  "step": 600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
95
  }
96
  ],
97
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7677543186180422,
6
  "eval_steps": 500,
7
+ "global_step": 800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
92
  "learning_rate": 2.3639274279615796e-05,
93
  "loss": 0.4287,
94
  "step": 600
95
+ },
96
+ {
97
+ "epoch": 0.6238003838771593,
98
+ "grad_norm": 1.5440646409988403,
99
+ "learning_rate": 2.097118463180363e-05,
100
+ "loss": 0.4093,
101
+ "step": 650
102
+ },
103
+ {
104
+ "epoch": 0.6717850287907869,
105
+ "grad_norm": 1.4985594749450684,
106
+ "learning_rate": 1.830309498399146e-05,
107
+ "loss": 0.4118,
108
+ "step": 700
109
+ },
110
+ {
111
+ "epoch": 0.7197696737044146,
112
+ "grad_norm": 1.6520227193832397,
113
+ "learning_rate": 1.5635005336179295e-05,
114
+ "loss": 0.3923,
115
+ "step": 750
116
+ },
117
+ {
118
+ "epoch": 0.7677543186180422,
119
+ "grad_norm": 1.6517823934555054,
120
+ "learning_rate": 1.2966915688367129e-05,
121
+ "loss": 0.4183,
122
+ "step": 800
123
  }
124
  ],
125
  "logging_steps": 50,