wuff-mann commited on
Commit
efb3b00
·
verified ·
1 Parent(s): 9b4085b

Upload sigma_lambda_v3/history.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. sigma_lambda_v3/history.json +21 -9
sigma_lambda_v3/history.json CHANGED
@@ -3,72 +3,84 @@
3
  1,
4
  2,
5
  3,
6
- 4
 
7
  ],
8
  "gen_loss": [
9
  30.399562595346868,
10
  22.764286764869794,
11
  15.396741087545925,
12
- 13.480450591629728
 
13
  ],
14
  "ret_loss": [
15
  796116674.0579515,
16
  5450725.260929077,
17
  350043.1876737281,
18
- 108628.19653386119
 
19
  ],
20
  "ppl": [
21
  48361.553911128496,
22
  10405.292656771971,
23
  1254.1789620978543,
24
- 264.47601817816616
 
25
  ],
26
  "tf_acc": [
27
  9.734349599431513e-06,
28
  0.39589275342567987,
29
  0.4354401710649703,
30
- 0.44354888428129674
 
31
  ],
32
  "fr_acc": [
33
  0.0,
34
  0.160561711572741,
35
  0.23937194341606105,
 
36
  0.23937194341606105
37
  ],
38
  "mrr": [
39
  0.007931923493742943,
40
  0.008492429740726948,
41
  0.00886960793286562,
42
- 0.009372583590447903
 
43
  ],
44
  "r1": [
45
  0.0010416667209938169,
46
  0.0010416667209938169,
47
  0.0010416667209938169,
 
48
  0.0010416667209938169
49
  ],
50
  "step_var": [
51
  0.15913955867290497,
52
  0.1598370373249054,
53
  0.16560138761997223,
54
- 0.17514024674892426
 
55
  ],
56
  "pos_slope": [
57
  0.4995734989643097,
58
  0.4980151951313019,
59
  0.4959738850593567,
60
- 0.49392592906951904
 
61
  ],
62
  "grad_norm": [
63
  2887832256709451.0,
64
  NaN,
65
  NaN,
 
66
  NaN
67
  ],
68
  "w_ret": [
69
  0.05,
70
  0.05,
71
  0.05,
72
- 0.083
 
73
  ]
74
  }
 
3
  1,
4
  2,
5
  3,
6
+ 4,
7
+ 5
8
  ],
9
  "gen_loss": [
10
  30.399562595346868,
11
  22.764286764869794,
12
  15.396741087545925,
13
+ 13.480450591629728,
14
+ 13.051396704105676
15
  ],
16
  "ret_loss": [
17
  796116674.0579515,
18
  5450725.260929077,
19
  350043.1876737281,
20
+ 108628.19653386119,
21
+ 58865.573026343496
22
  ],
23
  "ppl": [
24
  48361.553911128496,
25
  10405.292656771971,
26
  1254.1789620978543,
27
+ 264.47601817816616,
28
+ 127.8872290404574
29
  ],
30
  "tf_acc": [
31
  9.734349599431513e-06,
32
  0.39589275342567987,
33
  0.4354401710649703,
34
+ 0.44354888428129674,
35
+ 0.4487827195825911
36
  ],
37
  "fr_acc": [
38
  0.0,
39
  0.160561711572741,
40
  0.23937194341606105,
41
+ 0.23937194341606105,
42
  0.23937194341606105
43
  ],
44
  "mrr": [
45
  0.007931923493742943,
46
  0.008492429740726948,
47
  0.00886960793286562,
48
+ 0.009372583590447903,
49
+ 0.010170594789087772
50
  ],
51
  "r1": [
52
  0.0010416667209938169,
53
  0.0010416667209938169,
54
  0.0010416667209938169,
55
+ 0.0010416667209938169,
56
  0.0010416667209938169
57
  ],
58
  "step_var": [
59
  0.15913955867290497,
60
  0.1598370373249054,
61
  0.16560138761997223,
62
+ 0.17514024674892426,
63
+ 0.18433114886283875
64
  ],
65
  "pos_slope": [
66
  0.4995734989643097,
67
  0.4980151951313019,
68
  0.4959738850593567,
69
+ 0.49392592906951904,
70
+ 0.4921555817127228
71
  ],
72
  "grad_norm": [
73
  2887832256709451.0,
74
  NaN,
75
  NaN,
76
+ NaN,
77
  NaN
78
  ],
79
  "w_ret": [
80
  0.05,
81
  0.05,
82
  0.05,
83
+ 0.083,
84
+ 0.116
85
  ]
86
  }