SIGMA / sigma_lambda_v5 /history.json
wuff-mann's picture
Upload sigma_lambda_v5/history.json with huggingface_hub
6032be6 verified
raw
history blame
3.5 kB
Invalid JSON:Unexpected token 'N', ..."m": [ NaN, N"... is not valid JSON
{
"epoch": [
1,
2,
3,
4,
5,
6,
7,
4,
5,
6,
7,
8,
9,
10
],
"gen_loss": [
16.586591267879488,
22.012301083468923,
50.61838954157162,
114.44467188566325,
205.98175486637822,
333.0307641626024,
465.32868966012995,
48.11255316601957,
74.47382958961273,
116.53298210471324,
170.46740706801785,
214.5222631372081,
274.12421057906226,
323.5490314494401
],
"ret_loss": [
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0
],
"ppl": [
89.82908441173188,
160.04577946159412,
15470.654177938472,
485165195.4097903,
485165195.4097903,
485165195.4097903,
485165195.4097903,
15048.086253037915,
1624266.5983328498,
485165195.4097903,
485165195.4097903,
485165195.4097903,
485165195.4097903,
485165195.4097903
],
"tf_acc": [
0.46026214386231185,
0.47643615492864355,
0.47478209936121774,
0.4664326184178535,
0.4302312730702071,
0.4411152534131013,
0.4291537424388662,
0.4800979171424993,
0.4732017211019178,
0.46131388743580864,
0.45428323030789747,
0.44858981632247086,
0.44045584150537476,
0.41316392464284923
],
"fr_acc": [
0.12302286153389094,
0.11233910085013026,
0.24578219982631747,
0.2376122651857946,
0.13397800116550115,
0.1528195558526441,
0.04862503713606654,
0.2002858762969057,
0.24578219982631747,
0.27369709538827186,
0.12652472119383884,
0.14813148452854336,
0.1719167780748663,
0.1009754644864939
],
"mrr": [
0.006059600971639156,
0.006043825298547745,
0.006044529378414154,
0.006051086820662022,
0.006043311208486557,
0.0060408106073737144,
0.006041784770786762,
0.0060499003157019615,
0.006042419467121363,
0.006052091252058744,
0.006054983474314213,
0.006042384542524815,
0.006041090935468674,
0.006040983833372593
],
"r1": [
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322,
0.0007812500116415322
],
"step_var": [
0.16505937278270721,
0.18193045258522034,
0.20552654564380646,
0.23860830068588257,
0.2775871157646179,
0.312656432390213,
0.34328973293304443,
0.20889317989349365,
0.22339501976966858,
0.24468941986560822,
0.26731032133102417,
0.28763458132743835,
0.3055805563926697,
0.32141008973121643
],
"pos_slope": [
0.4985616207122803,
0.4935553967952728,
0.48772382736206055,
0.48204389214515686,
0.47680673003196716,
0.47214341163635254,
0.46813833713531494,
0.48697665333747864,
0.48436233401298523,
0.4812909960746765,
0.4783017337322235,
0.47553473711013794,
0.47306424379348755,
0.47092458605766296
],
"grad_norm": [
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null
],
"w_ret": [
0.0,
0.0,
0.0,
0.01,
0.02,
0.03,
0.04,
0.01,
0.02,
0.03,
0.04,
0.05,
0.08,
0.08
]
}