lucienbaumgartner committed on
Commit
b4c58b2
·
verified ·
1 Parent(s): e33da67

Add SetFit model

Browse files
Files changed (3) hide show
  1. README.md +13 -74
  2. model.safetensors +1 -1
  3. model_head.pkl +1 -1
README.md CHANGED
@@ -148,7 +148,7 @@ preds = model("it contradicted itself")
148
 
149
  ### Training Hyperparameters
150
  - batch_size: (16, 16)
151
- - num_epochs: (10, 10)
152
  - max_steps: -1
153
  - sampling_strategy: oversampling
154
  - num_iterations: 20
@@ -169,82 +169,21 @@ preds = model("it contradicted itself")
169
  | Epoch | Step | Training Loss | Validation Loss |
170
  |:------:|:----:|:-------------:|:---------------:|
171
  | 0.0026 | 1 | 0.2637 | - |
172
- | 0.1316 | 50 | 0.2322 | - |
173
- | 0.2632 | 100 | 0.1836 | - |
174
- | 0.3947 | 150 | 0.0803 | - |
175
- | 0.5263 | 200 | 0.016 | - |
176
- | 0.6579 | 250 | 0.0062 | - |
177
- | 0.7895 | 300 | 0.0016 | - |
178
- | 0.9211 | 350 | 0.0028 | - |
179
- | 1.0526 | 400 | 0.0006 | - |
180
- | 1.1842 | 450 | 0.0019 | - |
181
- | 1.3158 | 500 | 0.0013 | - |
182
- | 1.4474 | 550 | 0.0012 | - |
183
- | 1.5789 | 600 | 0.0003 | - |
184
  | 1.7105 | 650 | 0.0003 | - |
185
  | 1.8421 | 700 | 0.0002 | - |
186
  | 1.9737 | 750 | 0.0002 | - |
187
- | 2.1053 | 800 | 0.0001 | - |
188
- | 2.2368 | 850 | 0.0001 | - |
189
- | 2.3684 | 900 | 0.0001 | - |
190
- | 2.5 | 950 | 0.0001 | - |
191
- | 2.6316 | 1000 | 0.0002 | - |
192
- | 2.7632 | 1050 | 0.0001 | - |
193
- | 2.8947 | 1100 | 0.0001 | - |
194
- | 3.0263 | 1150 | 0.0001 | - |
195
- | 3.1579 | 1200 | 0.0001 | - |
196
- | 3.2895 | 1250 | 0.0001 | - |
197
- | 3.4211 | 1300 | 0.0001 | - |
198
- | 3.5526 | 1350 | 0.0001 | - |
199
- | 3.6842 | 1400 | 0.0001 | - |
200
- | 3.8158 | 1450 | 0.0001 | - |
201
- | 3.9474 | 1500 | 0.0001 | - |
202
- | 4.0789 | 1550 | 0.0001 | - |
203
- | 4.2105 | 1600 | 0.0001 | - |
204
- | 4.3421 | 1650 | 0.0001 | - |
205
- | 4.4737 | 1700 | 0.0001 | - |
206
- | 4.6053 | 1750 | 0.0001 | - |
207
- | 4.7368 | 1800 | 0.0001 | - |
208
- | 4.8684 | 1850 | 0.0001 | - |
209
- | 5.0 | 1900 | 0.0001 | - |
210
- | 5.1316 | 1950 | 0.0001 | - |
211
- | 5.2632 | 2000 | 0.0001 | - |
212
- | 5.3947 | 2050 | 0.0001 | - |
213
- | 5.5263 | 2100 | 0.0001 | - |
214
- | 5.6579 | 2150 | 0.0001 | - |
215
- | 5.7895 | 2200 | 0.0001 | - |
216
- | 5.9211 | 2250 | 0.0001 | - |
217
- | 6.0526 | 2300 | 0.0001 | - |
218
- | 6.1842 | 2350 | 0.0001 | - |
219
- | 6.3158 | 2400 | 0.0001 | - |
220
- | 6.4474 | 2450 | 0.0001 | - |
221
- | 6.5789 | 2500 | 0.0001 | - |
222
- | 6.7105 | 2550 | 0.0001 | - |
223
- | 6.8421 | 2600 | 0.0001 | - |
224
- | 6.9737 | 2650 | 0.0001 | - |
225
- | 7.1053 | 2700 | 0.0001 | - |
226
- | 7.2368 | 2750 | 0.0001 | - |
227
- | 7.3684 | 2800 | 0.0001 | - |
228
- | 7.5 | 2850 | 0.0001 | - |
229
- | 7.6316 | 2900 | 0.0001 | - |
230
- | 7.7632 | 2950 | 0.0001 | - |
231
- | 7.8947 | 3000 | 0.0001 | - |
232
- | 8.0263 | 3050 | 0.0001 | - |
233
- | 8.1579 | 3100 | 0.0001 | - |
234
- | 8.2895 | 3150 | 0.0001 | - |
235
- | 8.4211 | 3200 | 0.0001 | - |
236
- | 8.5526 | 3250 | 0.0 | - |
237
- | 8.6842 | 3300 | 0.0001 | - |
238
- | 8.8158 | 3350 | 0.0001 | - |
239
- | 8.9474 | 3400 | 0.0001 | - |
240
- | 9.0789 | 3450 | 0.0 | - |
241
- | 9.2105 | 3500 | 0.0 | - |
242
- | 9.3421 | 3550 | 0.0 | - |
243
- | 9.4737 | 3600 | 0.0001 | - |
244
- | 9.6053 | 3650 | 0.0001 | - |
245
- | 9.7368 | 3700 | 0.0 | - |
246
- | 9.8684 | 3750 | 0.0 | - |
247
- | 10.0 | 3800 | 0.0 | - |
248
 
249
  ### Framework Versions
250
  - Python: 3.11.9
 
148
 
149
  ### Training Hyperparameters
150
  - batch_size: (16, 16)
151
+ - num_epochs: (2, 2)
152
  - max_steps: -1
153
  - sampling_strategy: oversampling
154
  - num_iterations: 20
 
169
  | Epoch | Step | Training Loss | Validation Loss |
170
  |:------:|:----:|:-------------:|:---------------:|
171
  | 0.0026 | 1 | 0.2637 | - |
172
+ | 0.1316 | 50 | 0.2039 | - |
173
+ | 0.2632 | 100 | 0.0495 | - |
174
+ | 0.3947 | 150 | 0.0032 | - |
175
+ | 0.5263 | 200 | 0.0022 | - |
176
+ | 0.6579 | 250 | 0.0005 | - |
177
+ | 0.7895 | 300 | 0.0004 | - |
178
+ | 0.9211 | 350 | 0.002 | - |
179
+ | 1.0526 | 400 | 0.0003 | - |
180
+ | 1.1842 | 450 | 0.0012 | - |
181
+ | 1.3158 | 500 | 0.0007 | - |
182
+ | 1.4474 | 550 | 0.001 | - |
183
+ | 1.5789 | 600 | 0.0004 | - |
184
  | 1.7105 | 650 | 0.0003 | - |
185
  | 1.8421 | 700 | 0.0002 | - |
186
  | 1.9737 | 750 | 0.0002 | - |
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
187
 
188
  ### Framework Versions
189
  - Python: 3.11.9
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78e9c05b1a6371b2835cca3f7b00cb72894e6d80b350f78ae2849f9111476085
3
  size 437967672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:305ef987ea30da31bc4711f32ab255ddb23d5e26d1f78bf40174c77780ee8dbe
3
  size 437967672
model_head.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1167cafb1d56dc5beb298f6d211d78a09d161820cccc1f3a5a28af35cbecb85
3
  size 19855
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a78176d8f7350bd666675cfa5514ed5cb1602d3a028135fa11d44a3218ab168
3
  size 19855