wuff-mann commited on
Commit
b05c360
·
verified ·
1 Parent(s): 3780e4b

Upload sigma_lambda_proto_v4/history.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. sigma_lambda_proto_v4/history.json +29 -12
sigma_lambda_proto_v4/history.json CHANGED
@@ -15,7 +15,8 @@
15
  13,
16
  14,
17
  15,
18
- 16
 
19
  ],
20
  "gen_loss": [
21
  18.370433433850607,
@@ -33,7 +34,8 @@
33
  10.940823611346158,
34
  10.90196396784349,
35
  11.473219166524483,
36
- 11.477066975073381
 
37
  ],
38
  "ret_loss": [
39
  0.0,
@@ -51,7 +53,8 @@
51
  0.0,
52
  0.0,
53
  297885048197.7794,
54
- 185471042979.8594
 
55
  ],
56
  "ent_loss": [
57
  0.6078802872065342,
@@ -69,7 +72,8 @@
69
  0.5945930913000396,
70
  0.5991491057656028,
71
  0.6038948570959496,
72
- 0.6058890042521737
 
73
  ],
74
  "ppl": [
75
  40729.60576844635,
@@ -87,7 +91,8 @@
87
  48.41525029954994,
88
  47.256544770774525,
89
  57.93225257466221,
90
- 58.00014256149768
 
91
  ],
92
  "tf_acc": [
93
  9.249682110189831e-06,
@@ -105,7 +110,8 @@
105
  0.4732986161931464,
106
  0.47500545459195026,
107
  0.46299773491608087,
108
- 0.4629857647392324
 
109
  ],
110
  "fr_acc": [
111
  0.0,
@@ -123,7 +129,8 @@
123
  0.17980458818168835,
124
  0.14786793252599717,
125
  0.18805116826841511,
126
- 0.18621015772268792
 
127
  ],
128
  "def_rate": [
129
  0.0,
@@ -141,6 +148,7 @@
141
  1.0,
142
  0.95,
143
  1.0,
 
144
  1.0
145
  ],
146
  "mrr": [
@@ -159,7 +167,8 @@
159
  0.004978574346750975,
160
  0.004983400925993919,
161
  0.00775557104498148,
162
- 0.007759490050375462
 
163
  ],
164
  "r1": [
165
  0.0006249999860301614,
@@ -177,6 +186,7 @@
177
  0.0006249999860301614,
178
  0.0006249999860301614,
179
  0.0010416667209938169,
 
180
  0.0010416667209938169
181
  ],
182
  "ret_ok_pct": [
@@ -195,6 +205,7 @@
195
  0.0,
196
  0.0,
197
  100.0,
 
198
  100.0
199
  ],
200
  "grad_norm": [
@@ -213,6 +224,7 @@
213
  1172.9177006188306,
214
  1544.1169985122392,
215
  Infinity,
 
216
  Infinity
217
  ],
218
  "step_var": [
@@ -231,7 +243,8 @@
231
  0.2396431863307953,
232
  0.24049368500709534,
233
  0.2347075343132019,
234
- 0.23476119339466095
 
235
  ],
236
  "pos_slope": [
237
  0.49990350008010864,
@@ -249,7 +262,8 @@
249
  0.49562159180641174,
250
  0.49534475803375244,
251
  0.4971509277820587,
252
- 0.4969623386859894
 
253
  ],
254
  "beta_mean": [
255
  0.09998118132352829,
@@ -267,7 +281,8 @@
267
  0.09912104904651642,
268
  0.09906545281410217,
269
  0.09942715615034103,
270
- 0.0993889719247818
 
271
  ],
272
  "w_ret": [
273
  0.0,
@@ -285,10 +300,12 @@
285
  0.2,
286
  0.2,
287
  0.2,
 
288
  0.2
289
  ],
290
  "ret_raw": [
291
  297885048197.7794,
292
- 185471042979.8594
 
293
  ]
294
  }
 
15
  13,
16
  14,
17
  15,
18
+ 16,
19
+ 17
20
  ],
21
  "gen_loss": [
22
  18.370433433850607,
 
34
  10.940823611346158,
35
  10.90196396784349,
36
  11.473219166524483,
37
+ 11.477066975073381,
38
+ 11.481685707063386
39
  ],
40
  "ret_loss": [
41
  0.0,
 
53
  0.0,
54
  0.0,
55
  297885048197.7794,
56
+ 185471042979.8594,
57
+ 220422110895.04968
58
  ],
59
  "ent_loss": [
60
  0.6078802872065342,
 
72
  0.5945930913000396,
73
  0.5991491057656028,
74
  0.6038948570959496,
75
+ 0.6058890042521737,
76
+ 0.6026860457478147
77
  ],
78
  "ppl": [
79
  40729.60576844635,
 
91
  48.41525029954994,
92
  47.256544770774525,
93
  57.93225257466221,
94
+ 58.00014256149768,
95
+ 58.12945668251974
96
  ],
97
  "tf_acc": [
98
  9.249682110189831e-06,
 
110
  0.4732986161931464,
111
  0.47500545459195026,
112
  0.46299773491608087,
113
+ 0.4629857647392324,
114
+ 0.4629770591560699
115
  ],
116
  "fr_acc": [
117
  0.0,
 
129
  0.17980458818168835,
130
  0.14786793252599717,
131
  0.18805116826841511,
132
+ 0.18621015772268792,
133
+ 0.18743173221865267
134
  ],
135
  "def_rate": [
136
  0.0,
 
148
  1.0,
149
  0.95,
150
  1.0,
151
+ 1.0,
152
  1.0
153
  ],
154
  "mrr": [
 
167
  0.004978574346750975,
168
  0.004983400925993919,
169
  0.00775557104498148,
170
+ 0.007759490050375462,
171
+ 0.007763712666928768
172
  ],
173
  "r1": [
174
  0.0006249999860301614,
 
186
  0.0006249999860301614,
187
  0.0006249999860301614,
188
  0.0010416667209938169,
189
+ 0.0010416667209938169,
190
  0.0010416667209938169
191
  ],
192
  "ret_ok_pct": [
 
205
  0.0,
206
  0.0,
207
  100.0,
208
+ 100.0,
209
  100.0
210
  ],
211
  "grad_norm": [
 
224
  1172.9177006188306,
225
  1544.1169985122392,
226
  Infinity,
227
+ Infinity,
228
  Infinity
229
  ],
230
  "step_var": [
 
243
  0.2396431863307953,
244
  0.24049368500709534,
245
  0.2347075343132019,
246
+ 0.23476119339466095,
247
+ 0.2348354160785675
248
  ],
249
  "pos_slope": [
250
  0.49990350008010864,
 
262
  0.49562159180641174,
263
  0.49534475803375244,
264
  0.4971509277820587,
265
+ 0.4969623386859894,
266
+ 0.4967041313648224
267
  ],
268
  "beta_mean": [
269
  0.09998118132352829,
 
281
  0.09912104904651642,
282
  0.09906545281410217,
283
  0.09942715615034103,
284
+ 0.0993889719247818,
285
+ 0.09933643043041229
286
  ],
287
  "w_ret": [
288
  0.0,
 
300
  0.2,
301
  0.2,
302
  0.2,
303
+ 0.2,
304
  0.2
305
  ],
306
  "ret_raw": [
307
  297885048197.7794,
308
+ 185471042979.8594,
309
+ 220422110895.04968
310
  ]
311
  }