wuff-mann commited on
Commit
491357b
·
verified ·
1 Parent(s): 77c11e3

Upload sigma_lambda_v6/history.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. sigma_lambda_v6/history.json +22 -10
sigma_lambda_v6/history.json CHANGED
@@ -3,72 +3,84 @@
3
  1,
4
  2,
5
  3,
6
- 4
 
7
  ],
8
  "gen_loss": [
9
  16.730865429819772,
10
  10.815642579259727,
11
  11.253040295459758,
12
- 12.599300429961511
 
13
  ],
14
  "ret_loss": [
15
  0.0,
16
  0.0,
17
  0.0,
 
18
  0.0
19
  ],
20
  "ppl": [
21
  275.9590614528296,
22
  38.05776687300114,
23
  32.30925492774381,
24
- 35.023953072291675
 
25
  ],
26
  "tf_acc": [
27
  0.4522865752576864,
28
  0.484411723533269,
29
  0.49136870335305427,
30
- 0.4924278146573637
 
31
  ],
32
  "fr_acc": [
33
  0.12302286153389094,
34
  0.10218952820055761,
35
  0.23302846051007814,
36
- 0.25665842531651356
 
37
  ],
38
  "mrr": [
39
  0.006079697050154209,
40
  0.00607482623308897,
41
  0.0060824002139270306,
42
- 0.006060858257114887
 
43
  ],
44
  "r1": [
45
  0.0007812500116415322,
46
  0.0007812500116415322,
47
  0.0007812500116415322,
 
48
  0.0007812500116415322
49
  ],
50
  "step_var": [
51
  0.1615130603313446,
52
  0.1678009033203125,
53
  0.17375488579273224,
54
- 0.17968906462192535
 
55
  ],
56
  "pos_slope": [
57
  0.49914172291755676,
58
  0.4964430332183838,
59
  0.4936324656009674,
60
- 0.49108341336250305
 
61
  ],
62
  "grad_norm": [
63
  NaN,
64
  NaN,
65
  NaN,
66
- NaN
 
67
  ],
68
  "w_ret": [
69
  0.0,
70
  0.0,
71
  0.0,
72
- 0.01
 
73
  ]
74
  }
 
3
  1,
4
  2,
5
  3,
6
+ 4,
7
+ 5
8
  ],
9
  "gen_loss": [
10
  16.730865429819772,
11
  10.815642579259727,
12
  11.253040295459758,
13
+ 12.599300429961511,
14
+ 15.0517748842187
15
  ],
16
  "ret_loss": [
17
  0.0,
18
  0.0,
19
  0.0,
20
+ 0.0,
21
  0.0
22
  ],
23
  "ppl": [
24
  275.9590614528296,
25
  38.05776687300114,
26
  32.30925492774381,
27
+ 35.023953072291675,
28
+ 45.514587863029114
29
  ],
30
  "tf_acc": [
31
  0.4522865752576864,
32
  0.484411723533269,
33
  0.49136870335305427,
34
+ 0.4924278146573637,
35
+ 0.4915731578831036
36
  ],
37
  "fr_acc": [
38
  0.12302286153389094,
39
  0.10218952820055761,
40
  0.23302846051007814,
41
+ 0.25665842531651356,
42
+ 0.20978342531651356
43
  ],
44
  "mrr": [
45
  0.006079697050154209,
46
  0.00607482623308897,
47
  0.0060824002139270306,
48
+ 0.006060858257114887,
49
+ 0.006081360392272472
50
  ],
51
  "r1": [
52
  0.0007812500116415322,
53
  0.0007812500116415322,
54
  0.0007812500116415322,
55
+ 0.0007812500116415322,
56
  0.0007812500116415322
57
  ],
58
  "step_var": [
59
  0.1615130603313446,
60
  0.1678009033203125,
61
  0.17375488579273224,
62
+ 0.17968906462192535,
63
+ 0.1862482726573944
64
  ],
65
  "pos_slope": [
66
  0.49914172291755676,
67
  0.4964430332183838,
68
  0.4936324656009674,
69
+ 0.49108341336250305,
70
+ 0.48867347836494446
71
  ],
72
  "grad_norm": [
73
  NaN,
74
  NaN,
75
  NaN,
76
+ NaN,
77
+ Infinity
78
  ],
79
  "w_ret": [
80
  0.0,
81
  0.0,
82
  0.0,
83
+ 0.01,
84
+ 0.02
85
  ]
86
  }