wuff-mann committed on
Commit
7b64570
·
verified ·
1 Parent(s): 75881ec

Upload sigma_lambda_v5/history.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. sigma_lambda_v5/history.json +20 -8
sigma_lambda_v5/history.json CHANGED
@@ -3,72 +3,84 @@
3
  1,
4
  2,
5
  3,
6
- 4
 
7
  ],
8
  "gen_loss": [
9
  16.586591267879488,
10
  22.012301083468923,
11
  50.61838954157162,
12
- 114.44467188566325
 
13
  ],
14
  "ret_loss": [
15
  0.0,
16
  0.0,
17
  0.0,
 
18
  0.0
19
  ],
20
  "ppl": [
21
  89.82908441173188,
22
  160.04577946159412,
23
  15470.654177938472,
 
24
  485165195.4097903
25
  ],
26
  "tf_acc": [
27
  0.46026214386231185,
28
  0.47643615492864355,
29
  0.47478209936121774,
30
- 0.4664326184178535
 
31
  ],
32
  "fr_acc": [
33
  0.12302286153389094,
34
  0.11233910085013026,
35
  0.24578219982631747,
36
- 0.2376122651857946
 
37
  ],
38
  "mrr": [
39
  0.006059600971639156,
40
  0.006043825298547745,
41
  0.006044529378414154,
42
- 0.006051086820662022
 
43
  ],
44
  "r1": [
45
  0.0007812500116415322,
46
  0.0007812500116415322,
47
  0.0007812500116415322,
 
48
  0.0007812500116415322
49
  ],
50
  "step_var": [
51
  0.16505937278270721,
52
  0.18193045258522034,
53
  0.20552654564380646,
54
- 0.23860830068588257
 
55
  ],
56
  "pos_slope": [
57
  0.4985616207122803,
58
  0.4935553967952728,
59
  0.48772382736206055,
60
- 0.48204389214515686
 
61
  ],
62
  "grad_norm": [
63
  NaN,
64
  NaN,
65
  NaN,
 
66
  NaN
67
  ],
68
  "w_ret": [
69
  0.0,
70
  0.0,
71
  0.0,
72
- 0.01
 
73
  ]
74
  }
 
3
  1,
4
  2,
5
  3,
6
+ 4,
7
+ 5
8
  ],
9
  "gen_loss": [
10
  16.586591267879488,
11
  22.012301083468923,
12
  50.61838954157162,
13
+ 114.44467188566325,
14
+ 205.98175486637822
15
  ],
16
  "ret_loss": [
17
  0.0,
18
  0.0,
19
  0.0,
20
+ 0.0,
21
  0.0
22
  ],
23
  "ppl": [
24
  89.82908441173188,
25
  160.04577946159412,
26
  15470.654177938472,
27
+ 485165195.4097903,
28
  485165195.4097903
29
  ],
30
  "tf_acc": [
31
  0.46026214386231185,
32
  0.47643615492864355,
33
  0.47478209936121774,
34
+ 0.4664326184178535,
35
+ 0.4302312730702071
36
  ],
37
  "fr_acc": [
38
  0.12302286153389094,
39
  0.11233910085013026,
40
  0.24578219982631747,
41
+ 0.2376122651857946,
42
+ 0.13397800116550115
43
  ],
44
  "mrr": [
45
  0.006059600971639156,
46
  0.006043825298547745,
47
  0.006044529378414154,
48
+ 0.006051086820662022,
49
+ 0.006043311208486557
50
  ],
51
  "r1": [
52
  0.0007812500116415322,
53
  0.0007812500116415322,
54
  0.0007812500116415322,
55
+ 0.0007812500116415322,
56
  0.0007812500116415322
57
  ],
58
  "step_var": [
59
  0.16505937278270721,
60
  0.18193045258522034,
61
  0.20552654564380646,
62
+ 0.23860830068588257,
63
+ 0.2775871157646179
64
  ],
65
  "pos_slope": [
66
  0.4985616207122803,
67
  0.4935553967952728,
68
  0.48772382736206055,
69
+ 0.48204389214515686,
70
+ 0.47680673003196716
71
  ],
72
  "grad_norm": [
73
  NaN,
74
  NaN,
75
  NaN,
76
+ NaN,
77
  NaN
78
  ],
79
  "w_ret": [
80
  0.0,
81
  0.0,
82
  0.0,
83
+ 0.01,
84
+ 0.02
85
  ]
86
  }