wuff-mann commited on
Commit
845819d
·
verified ·
1 Parent(s): c15dc36

Upload sigma_lambda_proto_v4/history.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. sigma_lambda_proto_v4/history.json +29 -12
sigma_lambda_proto_v4/history.json CHANGED
@@ -16,7 +16,8 @@
16
  14,
17
  15,
18
  16,
19
- 17
 
20
  ],
21
  "gen_loss": [
22
  18.370433433850607,
@@ -35,7 +36,8 @@
35
  10.90196396784349,
36
  11.473219166524483,
37
  11.477066975073381,
38
- 11.481685707063386
 
39
  ],
40
  "ret_loss": [
41
  0.0,
@@ -54,7 +56,8 @@
54
  0.0,
55
  297885048197.7794,
56
  185471042979.8594,
57
- 220422110895.04968
 
58
  ],
59
  "ent_loss": [
60
  0.6078802872065342,
@@ -73,7 +76,8 @@
73
  0.5991491057656028,
74
  0.6038948570959496,
75
  0.6058890042521737,
76
- 0.6026860457478147
 
77
  ],
78
  "ppl": [
79
  40729.60576844635,
@@ -92,7 +96,8 @@
92
  47.256544770774525,
93
  57.93225257466221,
94
  58.00014256149768,
95
- 58.12945668251974
 
96
  ],
97
  "tf_acc": [
98
  9.249682110189831e-06,
@@ -111,7 +116,8 @@
111
  0.47500545459195026,
112
  0.46299773491608087,
113
  0.4629857647392324,
114
- 0.4629770591560699
 
115
  ],
116
  "fr_acc": [
117
  0.0,
@@ -130,7 +136,8 @@
130
  0.14786793252599717,
131
  0.18805116826841511,
132
  0.18621015772268792,
133
- 0.18743173221865267
 
134
  ],
135
  "def_rate": [
136
  0.0,
@@ -149,6 +156,7 @@
149
  0.95,
150
  1.0,
151
  1.0,
 
152
  1.0
153
  ],
154
  "mrr": [
@@ -168,7 +176,8 @@
168
  0.004983400925993919,
169
  0.00775557104498148,
170
  0.007759490050375462,
171
- 0.007763712666928768
 
172
  ],
173
  "r1": [
174
  0.0006249999860301614,
@@ -187,6 +196,7 @@
187
  0.0006249999860301614,
188
  0.0010416667209938169,
189
  0.0010416667209938169,
 
190
  0.0010416667209938169
191
  ],
192
  "ret_ok_pct": [
@@ -206,6 +216,7 @@
206
  0.0,
207
  100.0,
208
  100.0,
 
209
  100.0
210
  ],
211
  "grad_norm": [
@@ -225,6 +236,7 @@
225
  1544.1169985122392,
226
  Infinity,
227
  Infinity,
 
228
  Infinity
229
  ],
230
  "step_var": [
@@ -244,7 +256,8 @@
244
  0.24049368500709534,
245
  0.2347075343132019,
246
  0.23476119339466095,
247
- 0.2348354160785675
 
248
  ],
249
  "pos_slope": [
250
  0.49990350008010864,
@@ -263,7 +276,8 @@
263
  0.49534475803375244,
264
  0.4971509277820587,
265
  0.4969623386859894,
266
- 0.4967041313648224
 
267
  ],
268
  "beta_mean": [
269
  0.09998118132352829,
@@ -282,7 +296,8 @@
282
  0.09906545281410217,
283
  0.09942715615034103,
284
  0.0993889719247818,
285
- 0.09933643043041229
 
286
  ],
287
  "w_ret": [
288
  0.0,
@@ -301,11 +316,13 @@
301
  0.2,
302
  0.2,
303
  0.2,
 
304
  0.2
305
  ],
306
  "ret_raw": [
307
  297885048197.7794,
308
  185471042979.8594,
309
- 220422110895.04968
 
310
  ]
311
  }
 
16
  14,
17
  15,
18
  16,
19
+ 17,
20
+ 18
21
  ],
22
  "gen_loss": [
23
  18.370433433850607,
 
36
  10.90196396784349,
37
  11.473219166524483,
38
  11.477066975073381,
39
+ 11.481685707063386,
40
+ 11.48563595049309
41
  ],
42
  "ret_loss": [
43
  0.0,
 
56
  0.0,
57
  297885048197.7794,
58
  185471042979.8594,
59
+ 220422110895.04968,
60
+ 190796641934.95273
61
  ],
62
  "ent_loss": [
63
  0.6078802872065342,
 
76
  0.5991491057656028,
77
  0.6038948570959496,
78
  0.6058890042521737,
79
+ 0.6026860457478147,
80
+ 0.604040896025571
81
  ],
82
  "ppl": [
83
  40729.60576844635,
 
96
  47.256544770774525,
97
  57.93225257466221,
98
  58.00014256149768,
99
+ 58.12945668251974,
100
+ 58.12488720995803
101
  ],
102
  "tf_acc": [
103
  9.249682110189831e-06,
 
116
  0.47500545459195026,
117
  0.46299773491608087,
118
  0.4629857647392324,
119
+ 0.4629770591560699,
120
+ 0.46299773491608087
121
  ],
122
  "fr_acc": [
123
  0.0,
 
136
  0.14786793252599717,
137
  0.18805116826841511,
138
  0.18621015772268792,
139
+ 0.18743173221865267,
140
+ 0.18079325223458445
141
  ],
142
  "def_rate": [
143
  0.0,
 
156
  0.95,
157
  1.0,
158
  1.0,
159
+ 1.0,
160
  1.0
161
  ],
162
  "mrr": [
 
176
  0.004983400925993919,
177
  0.00775557104498148,
178
  0.007759490050375462,
179
+ 0.007763712666928768,
180
+ 0.007745448965579271
181
  ],
182
  "r1": [
183
  0.0006249999860301614,
 
196
  0.0006249999860301614,
197
  0.0010416667209938169,
198
  0.0010416667209938169,
199
+ 0.0010416667209938169,
200
  0.0010416667209938169
201
  ],
202
  "ret_ok_pct": [
 
216
  0.0,
217
  100.0,
218
  100.0,
219
+ 100.0,
220
  100.0
221
  ],
222
  "grad_norm": [
 
236
  1544.1169985122392,
237
  Infinity,
238
  Infinity,
239
+ Infinity,
240
  Infinity
241
  ],
242
  "step_var": [
 
256
  0.24049368500709534,
257
  0.2347075343132019,
258
  0.23476119339466095,
259
+ 0.2348354160785675,
260
+ 0.2349209189414978
261
  ],
262
  "pos_slope": [
263
  0.49990350008010864,
 
276
  0.49534475803375244,
277
  0.4971509277820587,
278
  0.4969623386859894,
279
+ 0.4967041313648224,
280
+ 0.49640679359436035
281
  ],
282
  "beta_mean": [
283
  0.09998118132352829,
 
296
  0.09906545281410217,
297
  0.09942715615034103,
298
  0.0993889719247818,
299
+ 0.09933643043041229,
300
+ 0.09927636384963989
301
  ],
302
  "w_ret": [
303
  0.0,
 
316
  0.2,
317
  0.2,
318
  0.2,
319
+ 0.2,
320
  0.2
321
  ],
322
  "ret_raw": [
323
  297885048197.7794,
324
  185471042979.8594,
325
+ 220422110895.04968,
326
+ 190796641934.95273
327
  ]
328
  }