wuff-mann commited on
Commit
e373a9e
·
verified ·
1 Parent(s): 192eae8

Upload sigma_lambda_proto_v3/history.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. sigma_lambda_proto_v3/history.json +28 -12
sigma_lambda_proto_v3/history.json CHANGED
@@ -6,7 +6,8 @@
6
  4,
7
  5,
8
  6,
9
- 7
 
10
  ],
11
  "gen_loss": [
12
  18.370433433850607,
@@ -15,7 +16,8 @@
15
  11.843723264174027,
16
  11.67701819376512,
17
  11.95506536512664,
18
- 11.651441534504746
 
19
  ],
20
  "ret_loss": [
21
  0.0,
@@ -24,6 +26,7 @@
24
  0.0,
25
  0.0,
26
  0.0,
 
27
  0.0
28
  ],
29
  "ent_loss": [
@@ -33,7 +36,8 @@
33
  0.6162352153026697,
34
  0.6095350569667238,
35
  0.6105213370467677,
36
- 0.6074923021143133
 
37
  ],
38
  "ppl": [
39
  40729.60576844635,
@@ -42,7 +46,8 @@
42
  123.54939191255174,
43
  81.4022446898097,
44
  73.53574793147658,
45
- 66.62547611610893
 
46
  ],
47
  "tf_acc": [
48
  9.249682110189831e-06,
@@ -51,7 +56,8 @@
51
  0.4409562865464462,
52
  0.4514476024551921,
53
  0.4529803291907453,
54
- 0.4559930050639289
 
55
  ],
56
  "fr_acc": [
57
  0.0,
@@ -60,7 +66,8 @@
60
  0.09257571660973458,
61
  0.1671656922337565,
62
  0.16827387097913035,
63
- 0.1727579081837558
 
64
  ],
65
  "def_rate": [
66
  0.0,
@@ -69,6 +76,7 @@
69
  0.45,
70
  1.0,
71
  1.0,
 
72
  1.0
73
  ],
74
  "mrr": [
@@ -78,7 +86,8 @@
78
  0.004980043042451143,
79
  0.004973841365426779,
80
  0.004973897710442543,
81
- 0.004973262082785368
 
82
  ],
83
  "r1": [
84
  0.0006249999860301614,
@@ -87,6 +96,7 @@
87
  0.0006249999860301614,
88
  0.0006249999860301614,
89
  0.0006249999860301614,
 
90
  0.0006249999860301614
91
  ],
92
  "ret_ok_pct": [
@@ -96,6 +106,7 @@
96
  0.0,
97
  0.0,
98
  0.0,
 
99
  0.0
100
  ],
101
  "grad_norm": [
@@ -105,7 +116,8 @@
105
  1217.5837738567411,
106
  1152.3023670419057,
107
  2138.4472111783607,
108
- 1115.3582513533938
 
109
  ],
110
  "step_var": [
111
  0.22542811930179596,
@@ -114,7 +126,8 @@
114
  0.22952058911323547,
115
  0.23098886013031006,
116
  0.23129060864448547,
117
- 0.23215171694755554
 
118
  ],
119
  "pos_slope": [
120
  0.49990350008010864,
@@ -123,7 +136,8 @@
123
  0.4988322854042053,
124
  0.4983888268470764,
125
  0.4982922673225403,
126
- 0.49802443385124207
 
127
  ],
128
  "beta_mean": [
129
  0.09998118132352829,
@@ -132,7 +146,8 @@
132
  0.09976637363433838,
133
  0.09967698156833649,
134
  0.0996585488319397,
135
- 0.09960417449474335
 
136
  ],
137
  "w_ret": [
138
  0.0,
@@ -141,6 +156,7 @@
141
  0.0,
142
  0.03,
143
  0.06,
144
- 0.09
 
145
  ]
146
  }
 
6
  4,
7
  5,
8
  6,
9
+ 7,
10
+ 8
11
  ],
12
  "gen_loss": [
13
  18.370433433850607,
 
16
  11.843723264174027,
17
  11.67701819376512,
18
  11.95506536512664,
19
+ 11.651441534504746,
20
+ 11.484277419465961
21
  ],
22
  "ret_loss": [
23
  0.0,
 
26
  0.0,
27
  0.0,
28
  0.0,
29
+ 0.0,
30
  0.0
31
  ],
32
  "ent_loss": [
 
36
  0.6162352153026697,
37
  0.6095350569667238,
38
  0.6105213370467677,
39
+ 0.6074923021143133,
40
+ 0.606140976638505
41
  ],
42
  "ppl": [
43
  40729.60576844635,
 
46
  123.54939191255174,
47
  81.4022446898097,
48
  73.53574793147658,
49
+ 66.62547611610893,
50
+ 61.79489383359564
51
  ],
52
  "tf_acc": [
53
  9.249682110189831e-06,
 
56
  0.4409562865464462,
57
  0.4514476024551921,
58
  0.4529803291907453,
59
+ 0.4559930050639289,
60
+ 0.45953291281739334
61
  ],
62
  "fr_acc": [
63
  0.0,
 
66
  0.09257571660973458,
67
  0.1671656922337565,
68
  0.16827387097913035,
69
+ 0.1727579081837558,
70
+ 0.18450658056400712
71
  ],
72
  "def_rate": [
73
  0.0,
 
76
  0.45,
77
  1.0,
78
  1.0,
79
+ 1.0,
80
  1.0
81
  ],
82
  "mrr": [
 
86
  0.004980043042451143,
87
  0.004973841365426779,
88
  0.004973897710442543,
89
+ 0.004973262082785368,
90
+ 0.004975350573658943
91
  ],
92
  "r1": [
93
  0.0006249999860301614,
 
96
  0.0006249999860301614,
97
  0.0006249999860301614,
98
  0.0006249999860301614,
99
+ 0.0006249999860301614,
100
  0.0006249999860301614
101
  ],
102
  "ret_ok_pct": [
 
106
  0.0,
107
  0.0,
108
  0.0,
109
+ 0.0,
110
  0.0
111
  ],
112
  "grad_norm": [
 
116
  1217.5837738567411,
117
  1152.3023670419057,
118
  2138.4472111783607,
119
+ 1115.3582513533938,
120
+ 1271.3913563283284
121
  ],
122
  "step_var": [
123
  0.22542811930179596,
 
126
  0.22952058911323547,
127
  0.23098886013031006,
128
  0.23129060864448547,
129
+ 0.23215171694755554,
130
+ 0.23333927989006042
131
  ],
132
  "pos_slope": [
133
  0.49990350008010864,
 
136
  0.4988322854042053,
137
  0.4983888268470764,
138
  0.4982922673225403,
139
+ 0.49802443385124207,
140
+ 0.49764952063560486
141
  ],
142
  "beta_mean": [
143
  0.09998118132352829,
 
146
  0.09976637363433838,
147
  0.09967698156833649,
148
  0.0996585488319397,
149
+ 0.09960417449474335,
150
+ 0.09952875226736069
151
  ],
152
  "w_ret": [
153
  0.0,
 
156
  0.0,
157
  0.03,
158
  0.06,
159
+ 0.09,
160
+ 0.12
161
  ]
162
  }