wuff-mann commited on
Commit
5171df8
·
verified ·
1 Parent(s): 1135c42

Upload sigma_lambda_proto_v1/history.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. sigma_lambda_proto_v1/history.json +26 -12
sigma_lambda_proto_v1/history.json CHANGED
@@ -3,84 +3,98 @@
3
  1,
4
  2,
5
  3,
6
- 4
 
7
  ],
8
  "gen_loss": [
9
  14.378914150180238,
10
  10.41937110927972,
11
  9.95253911739046,
12
- 9.72740114264416
 
13
  ],
14
  "ret_loss": [
15
  0.0,
16
  0.0,
17
  0.0,
 
18
  0.0
19
  ],
20
  "ppl": [
21
  105.51695237627168,
22
  36.01809758482572,
23
  29.905926998953085,
24
- 27.759728442854154
 
25
  ],
26
  "tf_acc": [
27
  0.44998506448388675,
28
  0.4889349317509485,
29
  0.5010759556689941,
30
- 0.5067917151141438
 
31
  ],
32
  "fr_acc": [
33
  0.15843538324420675,
34
  0.21595909319438727,
35
  0.22207020430549843,
36
- 0.17343382924265277
 
37
  ],
38
  "mrr": [
39
  0.01984136737883091,
40
  0.02093728445470333,
41
  0.021167319267988205,
42
- 0.02771509811282158
 
43
  ],
44
  "r1": [
45
  0.0031250000465661287,
46
  0.0031250000465661287,
47
  0.0031250000465661287,
48
- 0.00937500037252903
 
49
  ],
50
  "he_proxy": [
51
  0.0,
52
  0.0,
53
  0.0692528888652218,
 
54
  0.0
55
  ],
56
  "grad_norm": [
57
  69556.54960830766,
58
  524881.9476341035,
59
  129648.56937981857,
60
- 68050.81607155707
 
61
  ],
62
  "step_var": [
63
  0.2371368706226349,
64
  0.276157945394516,
65
  0.3243665397167206,
66
- 0.37456902861595154
 
67
  ],
68
  "pos_slope": [
69
  0.4982355535030365,
70
  0.4918489158153534,
71
  0.48427340388298035,
72
- 0.4768323302268982
 
73
  ],
74
  "beta_mean": [
75
  0.09964697062969208,
76
  0.0983697697520256,
77
  0.09685240685939789,
78
- 0.0953640341758728
 
79
  ],
80
  "w_ret": [
81
  0.0,
82
  0.0,
83
  0.0,
84
- 0.0
 
85
  ]
86
  }
 
3
  1,
4
  2,
5
  3,
6
+ 4,
7
+ 5
8
  ],
9
  "gen_loss": [
10
  14.378914150180238,
11
  10.41937110927972,
12
  9.95253911739046,
13
+ 9.72740114264416,
14
+ 9.55466846523863
15
  ],
16
  "ret_loss": [
17
  0.0,
18
  0.0,
19
  0.0,
20
+ 0.0,
21
  0.0
22
  ],
23
  "ppl": [
24
  105.51695237627168,
25
  36.01809758482572,
26
  29.905926998953085,
27
+ 27.759728442854154,
28
+ 26.567988921309055
29
  ],
30
  "tf_acc": [
31
  0.44998506448388675,
32
  0.4889349317509485,
33
  0.5010759556689941,
34
+ 0.5067917151141438,
35
+ 0.5109845416047981
36
  ],
37
  "fr_acc": [
38
  0.15843538324420675,
39
  0.21595909319438727,
40
  0.22207020430549843,
41
+ 0.17343382924265277,
42
+ 0.21467075734722796
43
  ],
44
  "mrr": [
45
  0.01984136737883091,
46
  0.02093728445470333,
47
  0.021167319267988205,
48
+ 0.02771509811282158,
49
+ 0.025447646155953407
50
  ],
51
  "r1": [
52
  0.0031250000465661287,
53
  0.0031250000465661287,
54
  0.0031250000465661287,
55
+ 0.00937500037252903,
56
+ 0.0031250000465661287
57
  ],
58
  "he_proxy": [
59
  0.0,
60
  0.0,
61
  0.0692528888652218,
62
+ 0.0,
63
  0.0
64
  ],
65
  "grad_norm": [
66
  69556.54960830766,
67
  524881.9476341035,
68
  129648.56937981857,
69
+ 68050.81607155707,
70
+ 164660.7477113645
71
  ],
72
  "step_var": [
73
  0.2371368706226349,
74
  0.276157945394516,
75
  0.3243665397167206,
76
+ 0.37456902861595154,
77
+ 0.4257376194000244
78
  ],
79
  "pos_slope": [
80
  0.4982355535030365,
81
  0.4918489158153534,
82
  0.48427340388298035,
83
+ 0.4768323302268982,
84
+ 0.4699003994464874
85
  ],
86
  "beta_mean": [
87
  0.09964697062969208,
88
  0.0983697697520256,
89
  0.09685240685939789,
90
+ 0.0953640341758728,
91
+ 0.09398408234119415
92
  ],
93
  "w_ret": [
94
  0.0,
95
  0.0,
96
  0.0,
97
+ 0.0,
98
+ 0.03
99
  ]
100
  }