File size: 3,652 Bytes
a2ca250
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
{
  "step": [
    50,
    100,
    150,
    200,
    250,
    300,
    350,
    400,
    450,
    500,
    550,
    600,
    650,
    700,
    750,
    800,
    850,
    900
  ],
  "train_loss": [
    1.229721450805664,
    1.1041190230846405,
    1.025876224040985,
    1.0216933679580689,
    0.9389291417598724,
    0.9820241594314575,
    0.971408588886261,
    0.9302374482154846,
    0.9171168172359466,
    0.921946108341217,
    0.9294362807273865,
    0.9058246970176697,
    0.8852759146690369,
    0.9285594654083252,
    0.9111053240299225,
    0.8563614284992218,
    0.8970540463924408,
    0.882376617193222
  ],
  "val_nll": [
    1.245873212814331,
    1.1079651455084483,
    1.0574054757754008,
    1.024699628353119,
    1.0064872364203135,
    0.9878634532292684,
    0.9754222611586253,
    0.9647026916344961,
    0.9550074140230814,
    0.9492202738920847,
    0.9425136148929596,
    0.93640163342158,
    0.9316958208878835,
    0.9284021159013113,
    0.9264170686403911,
    0.9249595264593761,
    0.9239107569058737,
    0.9228900790214538
  ],
  "val_ppl": [
    3.475968734949889,
    3.0281901944508567,
    2.8788919363026415,
    2.786258421829991,
    2.735973287632187,
    2.685490662172586,
    2.652286932311601,
    2.6240074011406005,
    2.598689849594626,
    2.58369429980331,
    2.5664243198423558,
    2.55078622052022,
    2.5388108976642356,
    2.530462559579264,
    2.525444454042619,
    2.521766193486182,
    2.519122828264174,
    2.516552927049002
  ],
  "lr": [
    0.00019998312416333227,
    0.0001979649067087574,
    0.00019264940672148018,
    0.00018421553219875658,
    0.0001729471487418621,
    0.00015922352526649803,
    0.00014350656864820733,
    0.00012632527695645993,
    0.00010825793454723325,
    8.991264828797319e-05,
    7.190688002264308e-05,
    5.484666416891109e-05,
    3.9306209937284346e-05,
    2.5808574716471856e-05,
    1.4808059116167305e-05,
    1e-05,
    1e-05,
    1e-05
  ],
  "grad_norm": [
    0.3591911792755127,
    0.36388659477233887,
    0.37539058923721313,
    0.3457748591899872,
    0.29278653860092163,
    0.3325034976005554,
    0.31695958971977234,
    0.31593164801597595,
    0.31353333592414856,
    0.3333532512187958,
    0.3345634937286377,
    0.31411102414131165,
    0.29149293899536133,
    0.3208323121070862,
    0.2993287742137909,
    0.30689114332199097,
    0.3200317621231079,
    0.30858248472213745
  ],
  "tok_per_sec": [
    6706.525285452902,
    6700.058062558346,
    6697.280101536737,
    6680.071604788786,
    6683.553221953783,
    6685.66879995729,
    6679.849924100408,
    6681.899978577697,
    6684.255805925504,
    6681.92172154577,
    6684.531310449166,
    6686.6788334140565,
    6684.5712078021825,
    6686.219542291029,
    6687.095210911167,
    6685.0861424049535,
    6686.302034296362,
    6687.162565026619
  ],
  "vram_gb": [
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224,
    31.77780224
  ],
  "elapsed_hr": [
    0.13572188032997978,
    0.27170577141973706,
    0.40772770815425446,
    0.5450374044312372,
    0.6809418523311614,
    0.8168716543912887,
    0.9538471115297741,
    1.089776530795627,
    1.2255665010213852,
    1.3622162308295567,
    1.4978528754578697,
    1.633496529261271,
    1.7701791963974636,
    1.9058768606848187,
    2.041743522816234,
    2.1785142697228324,
    2.314250492784712,
    2.4500675496790145
  ]
}