wuff-mann commited on
Commit
f00ad34
·
verified ·
1 Parent(s): 85e31ba

Upload sigma_lambda_proto_v1/history.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. sigma_lambda_proto_v1/history.json +26 -12
sigma_lambda_proto_v1/history.json CHANGED
@@ -5,7 +5,8 @@
5
  3,
6
  4,
7
  5,
8
- 6
 
9
  ],
10
  "gen_loss": [
11
  14.378914150180238,
@@ -13,7 +14,8 @@
13
  9.95253911739046,
14
  9.72740114264416,
15
  9.55466846523863,
16
- 9.424415427897916
 
17
  ],
18
  "ret_loss": [
19
  0.0,
@@ -21,6 +23,7 @@
21
  0.0,
22
  0.0,
23
  0.0,
 
24
  0.0
25
  ],
26
  "ppl": [
@@ -29,7 +32,8 @@
29
  29.905926998953085,
30
  27.759728442854154,
31
  26.567988921309055,
32
- 25.650242317335714
 
33
  ],
34
  "tf_acc": [
35
  0.44998506448388675,
@@ -37,7 +41,8 @@
37
  0.5010759556689941,
38
  0.5067917151141438,
39
  0.5109845416047981,
40
- 0.5145881089351385
 
41
  ],
42
  "fr_acc": [
43
  0.15843538324420675,
@@ -45,7 +50,8 @@
45
  0.22207020430549843,
46
  0.17343382924265277,
47
  0.21467075734722796,
48
- 0.132664598473422
 
49
  ],
50
  "mrr": [
51
  0.01984136737883091,
@@ -53,7 +59,8 @@
53
  0.021167319267988205,
54
  0.02771509811282158,
55
  0.025447646155953407,
56
- 0.028147408738732338
 
57
  ],
58
  "r1": [
59
  0.0031250000465661287,
@@ -61,6 +68,7 @@
61
  0.0031250000465661287,
62
  0.00937500037252903,
63
  0.0031250000465661287,
 
64
  0.0031250000465661287
65
  ],
66
  "he_proxy": [
@@ -69,7 +77,8 @@
69
  0.0692528888652218,
70
  0.0,
71
  0.0,
72
- 0.067495606794824
 
73
  ],
74
  "grad_norm": [
75
  69556.54960830766,
@@ -77,7 +86,8 @@
77
  129648.56937981857,
78
  68050.81607155707,
79
  164660.7477113645,
80
- 169132.88870452382
 
81
  ],
82
  "step_var": [
83
  0.2371368706226349,
@@ -85,7 +95,8 @@
85
  0.3243665397167206,
86
  0.37456902861595154,
87
  0.4257376194000244,
88
- 0.47667616605758667
 
89
  ],
90
  "pos_slope": [
91
  0.4982355535030365,
@@ -93,7 +104,8 @@
93
  0.48427340388298035,
94
  0.4768323302268982,
95
  0.4699003994464874,
96
- 0.4636712968349457
 
97
  ],
98
  "beta_mean": [
99
  0.09964697062969208,
@@ -101,7 +113,8 @@
101
  0.09685240685939789,
102
  0.0953640341758728,
103
  0.09398408234119415,
104
- 0.09273404628038406
 
105
  ],
106
  "w_ret": [
107
  0.0,
@@ -109,6 +122,7 @@
109
  0.0,
110
  0.0,
111
  0.03,
112
- 0.06
 
113
  ]
114
  }
 
5
  3,
6
  4,
7
  5,
8
+ 6,
9
+ 7
10
  ],
11
  "gen_loss": [
12
  14.378914150180238,
 
14
  9.95253911739046,
15
  9.72740114264416,
16
  9.55466846523863,
17
+ 9.424415427897916,
18
+ 9.337661864071181
19
  ],
20
  "ret_loss": [
21
  0.0,
 
23
  0.0,
24
  0.0,
25
  0.0,
26
+ 0.0,
27
  0.0
28
  ],
29
  "ppl": [
 
32
  29.905926998953085,
33
  27.759728442854154,
34
  26.567988921309055,
35
+ 25.650242317335714,
36
+ 25.075453392796494
37
  ],
38
  "tf_acc": [
39
  0.44998506448388675,
 
41
  0.5010759556689941,
42
  0.5067917151141438,
43
  0.5109845416047981,
44
+ 0.5145881089351385,
45
+ 0.5173037067829007
46
  ],
47
  "fr_acc": [
48
  0.15843538324420675,
 
50
  0.22207020430549843,
51
  0.17343382924265277,
52
  0.21467075734722796,
53
+ 0.132664598473422,
54
+ 0.2427502285296403
55
  ],
56
  "mrr": [
57
  0.01984136737883091,
 
59
  0.021167319267988205,
60
  0.02771509811282158,
61
  0.025447646155953407,
62
+ 0.028147408738732338,
63
+ 0.031810443848371506
64
  ],
65
  "r1": [
66
  0.0031250000465661287,
 
68
  0.0031250000465661287,
69
  0.00937500037252903,
70
  0.0031250000465661287,
71
+ 0.0031250000465661287,
72
  0.0031250000465661287
73
  ],
74
  "he_proxy": [
 
77
  0.0692528888652218,
78
  0.0,
79
  0.0,
80
+ 0.067495606794824,
81
+ 0.0
82
  ],
83
  "grad_norm": [
84
  69556.54960830766,
 
86
  129648.56937981857,
87
  68050.81607155707,
88
  164660.7477113645,
89
+ 169132.88870452382,
90
+ 347530.32776330994
91
  ],
92
  "step_var": [
93
  0.2371368706226349,
 
95
  0.3243665397167206,
96
  0.37456902861595154,
97
  0.4257376194000244,
98
+ 0.47667616605758667,
99
+ 0.5235044360160828
100
  ],
101
  "pos_slope": [
102
  0.4982355535030365,
 
104
  0.48427340388298035,
105
  0.4768323302268982,
106
  0.4699003994464874,
107
+ 0.4636712968349457,
108
+ 0.4582301080226898
109
  ],
110
  "beta_mean": [
111
  0.09964697062969208,
 
113
  0.09685240685939789,
114
  0.0953640341758728,
115
  0.09398408234119415,
116
+ 0.09273404628038406,
117
+ 0.09163296222686768
118
  ],
119
  "w_ret": [
120
  0.0,
 
122
  0.0,
123
  0.0,
124
  0.03,
125
+ 0.06,
126
+ 0.09
127
  ]
128
  }