guyhadad01 committed on
Commit
d922c77
·
verified ·
1 Parent(s): ccacbd8

Training in progress, step 1000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -505,9 +505,9 @@ print(embeddings.shape)
505
  # Get the similarity scores for the embeddings
506
  similarities = model.similarity(embeddings, embeddings)
507
  print(similarities)
508
- # tensor([[ 1.0000, 0.6636, -0.0516],
509
- # [ 0.6636, 1.0000, -0.0845],
510
- # [-0.0516, -0.0845, 1.0000]])
511
  ```
512
 
513
  <!--
@@ -731,6 +731,10 @@ You can finetune this model on your own dataset.
731
  | 0.6718 | 700 | 0.4118 |
732
  | 0.7198 | 750 | 0.3923 |
733
  | 0.7678 | 800 | 0.4183 |
 
 
 
 
734
 
735
 
736
  ### Framework Versions
 
505
  # Get the similarity scores for the embeddings
506
  similarities = model.similarity(embeddings, embeddings)
507
  print(similarities)
508
+ # tensor([[ 1.0000, 0.6589, -0.0461],
509
+ # [ 0.6589, 1.0000, -0.0710],
510
+ # [-0.0461, -0.0710, 1.0000]])
511
  ```
512
 
513
  <!--
 
731
  | 0.6718 | 700 | 0.4118 |
732
  | 0.7198 | 750 | 0.3923 |
733
  | 0.7678 | 800 | 0.4183 |
734
+ | 0.8157 | 850 | 0.3991 |
735
+ | 0.8637 | 900 | 0.3947 |
736
+ | 0.9117 | 950 | 0.3777 |
737
+ | 0.9597 | 1000 | 0.3942 |
738
 
739
 
740
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff756dbb38a75171525943ee07a6245096eef361b8236a195a79e2f4c43e6b40
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16ed94def781e3941dec110dda20c76143833c045568e9b68f20230a6ae8dd0e
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:519486a3681858d50acde069f580d97e5840fa5ac9d65b3f042141bd25e1cb41
3
  size 180608203
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:109c98bb23626540dc184662d8b7b94cc56388db552e4887f65978941a59d183
3
  size 180608203
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f16fa28ebb8e3a1b82ca55c6cf1c0dd60b11d4021c7a97520baf445d2c84fd8
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f906e0b5b6d6a9c4fe87955d19f0e941b5338d2f71853b6ff2c15b409507ceee
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d57a1899b276deaf9bc6c347b576a36bf470824199b1d1731a5698c732cc5649
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f05941cd5d89b2195b06001cebc4cb31c0ae73bf191526abcbbf01177ebf8dc
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7677543186180422,
6
  "eval_steps": 500,
7
- "global_step": 800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -120,6 +120,34 @@
120
  "learning_rate": 1.2966915688367129e-05,
121
  "loss": 0.4183,
122
  "step": 800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
123
  }
124
  ],
125
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9596928982725528,
6
  "eval_steps": 500,
7
+ "global_step": 1000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
120
  "learning_rate": 1.2966915688367129e-05,
121
  "loss": 0.4183,
122
  "step": 800
123
+ },
124
+ {
125
+ "epoch": 0.8157389635316699,
126
+ "grad_norm": 1.7299295663833618,
127
+ "learning_rate": 1.0298826040554963e-05,
128
+ "loss": 0.3991,
129
+ "step": 850
130
+ },
131
+ {
132
+ "epoch": 0.8637236084452975,
133
+ "grad_norm": 1.717519998550415,
134
+ "learning_rate": 7.630736392742796e-06,
135
+ "loss": 0.3947,
136
+ "step": 900
137
+ },
138
+ {
139
+ "epoch": 0.9117082533589251,
140
+ "grad_norm": 1.5044348239898682,
141
+ "learning_rate": 4.96264674493063e-06,
142
+ "loss": 0.3777,
143
+ "step": 950
144
+ },
145
+ {
146
+ "epoch": 0.9596928982725528,
147
+ "grad_norm": 1.5577826499938965,
148
+ "learning_rate": 2.294557097118463e-06,
149
+ "loss": 0.3942,
150
+ "step": 1000
151
  }
152
  ],
153
  "logging_steps": 50,