ilessio-aiflowlab commited on
Commit
0ff5b85
·
verified ·
1 Parent(s): ad7e9a1

Upload benchmarks/bench_03_training.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. benchmarks/bench_03_training.json +265 -0
benchmarks/bench_03_training.json ADDED
@@ -0,0 +1,265 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "benchmark": "kd_training",
3
+ "timestamp": "2026-03-19T11:54:28.894463+00:00",
4
+ "device": "NVIDIA L4",
5
+ "model": "forge-nano",
6
+ "optimizer": "AdamW",
7
+ "grad_clip": 1.0,
8
+ "run_1_lr2e4_50steps": {
9
+ "n_steps": 50,
10
+ "loss_start": 8.3049,
11
+ "loss_end": 1.9631,
12
+ "loss_min": 0.4144,
13
+ "loss_reduction_pct": 76.4,
14
+ "loss_first_10_mean": 24.1221,
15
+ "loss_last_10_mean": 1.7797,
16
+ "step_time_mean_ms": 366.8,
17
+ "step_time_std_ms": 110.5,
18
+ "step_time_p50_ms": 350.5,
19
+ "step_time_p95_ms": 357.6,
20
+ "steps_per_sec": 2.73,
21
+ "total_time_s": 18.3,
22
+ "gpu_mem_peak_gb": 9.65,
23
+ "loss_curve": [
24
+ 8.3049,
25
+ 91.3748,
26
+ 22.7864,
27
+ 100.3036,
28
+ 6.4863,
29
+ 1.8932,
30
+ 5.1797,
31
+ 2.4485,
32
+ 1.5367,
33
+ 0.9069,
34
+ 2.0219,
35
+ 2.19,
36
+ 2.6092,
37
+ 3.797,
38
+ 1.3194,
39
+ 0.4144,
40
+ 0.6227,
41
+ 1.3961,
42
+ 1.9846,
43
+ 1.3349,
44
+ 3.9967,
45
+ 2.4535,
46
+ 2.7646,
47
+ 4.1622,
48
+ 3.9146,
49
+ 1.3404,
50
+ 1.2876,
51
+ 3.0286,
52
+ 1.2856,
53
+ 1.5534,
54
+ 1.2389,
55
+ 2.0355,
56
+ 2.3023,
57
+ 2.7555,
58
+ 1.4107,
59
+ 1.1905,
60
+ 2.2219,
61
+ 1.3844,
62
+ 0.429,
63
+ 0.593,
64
+ 0.6824,
65
+ 2.0748,
66
+ 1.9094,
67
+ 1.6577,
68
+ 1.3618,
69
+ 2.5235,
70
+ 1.7971,
71
+ 2.1732,
72
+ 1.6541,
73
+ 1.9631
74
+ ],
75
+ "lr": 0.0002
76
+ },
77
+ "run_2_lr5e4_50steps": {
78
+ "n_steps": 50,
79
+ "loss_start": 6.7827,
80
+ "loss_end": 1.3755,
81
+ "loss_min": 0.4417,
82
+ "loss_reduction_pct": 79.7,
83
+ "loss_first_10_mean": 19.092,
84
+ "loss_last_10_mean": 1.9989,
85
+ "step_time_mean_ms": 354.8,
86
+ "step_time_std_ms": 7.8,
87
+ "step_time_p50_ms": 352.3,
88
+ "step_time_p95_ms": 374.3,
89
+ "steps_per_sec": 2.82,
90
+ "total_time_s": 17.7,
91
+ "gpu_mem_peak_gb": 14.97,
92
+ "loss_curve": [
93
+ 6.7827,
94
+ 101.8204,
95
+ 42.7009,
96
+ 22.8225,
97
+ 5.315,
98
+ 1.8645,
99
+ 3.7638,
100
+ 2.9647,
101
+ 1.3539,
102
+ 1.5311,
103
+ 3.3165,
104
+ 5.2206,
105
+ 3.9817,
106
+ 2.5642,
107
+ 1.7403,
108
+ 2.0605,
109
+ 3.2802,
110
+ 2.5078,
111
+ 2.1435,
112
+ 1.4227,
113
+ 1.4168,
114
+ 1.3798,
115
+ 0.8019,
116
+ 1.7231,
117
+ 1.5066,
118
+ 0.4417,
119
+ 2.0965,
120
+ 1.448,
121
+ 1.0429,
122
+ 2.2694,
123
+ 1.3545,
124
+ 3.3713,
125
+ 4.234,
126
+ 1.9851,
127
+ 2.2198,
128
+ 3.6816,
129
+ 1.9721,
130
+ 1.2497,
131
+ 1.7489,
132
+ 1.1938,
133
+ 2.6041,
134
+ 2.2241,
135
+ 2.243,
136
+ 2.0544,
137
+ 2.7285,
138
+ 3.8225,
139
+ 1.0744,
140
+ 0.9204,
141
+ 0.9423,
142
+ 1.3755
143
+ ],
144
+ "lr": 0.0005
145
+ },
146
+ "run_3_lr2e4_100steps": {
147
+ "n_steps": 100,
148
+ "loss_start": 14.3952,
149
+ "loss_end": 1.012,
150
+ "loss_min": 0.4931,
151
+ "loss_reduction_pct": 93.0,
152
+ "loss_first_10_mean": 19.4893,
153
+ "loss_last_10_mean": 1.5553,
154
+ "step_time_mean_ms": 352.4,
155
+ "step_time_std_ms": 5.7,
156
+ "step_time_p50_ms": 350.9,
157
+ "step_time_p95_ms": 360.9,
158
+ "steps_per_sec": 2.84,
159
+ "total_time_s": 35.2,
160
+ "gpu_mem_peak_gb": 20.29,
161
+ "loss_curve": [
162
+ 14.3952,
163
+ 76.3616,
164
+ 64.1362,
165
+ 2.7626,
166
+ 18.884,
167
+ 5.4128,
168
+ 10.6415,
169
+ 0.9251,
170
+ 0.7577,
171
+ 0.6167,
172
+ 2.7718,
173
+ 2.1239,
174
+ 1.3505,
175
+ 2.7245,
176
+ 2.1935,
177
+ 1.1396,
178
+ 2.7094,
179
+ 0.6373,
180
+ 1.4863,
181
+ 1.2989,
182
+ 2.3638,
183
+ 0.6327,
184
+ 1.136,
185
+ 1.5452,
186
+ 0.4931,
187
+ 1.5772,
188
+ 0.9071,
189
+ 1.362,
190
+ 1.3342,
191
+ 2.1487,
192
+ 1.2072,
193
+ 2.0984,
194
+ 1.3063,
195
+ 0.9049,
196
+ 2.2391,
197
+ 1.4513,
198
+ 3.1519,
199
+ 1.0175,
200
+ 1.4259,
201
+ 1.0024,
202
+ 0.698,
203
+ 1.538,
204
+ 2.7462,
205
+ 1.3369,
206
+ 0.6757,
207
+ 1.633,
208
+ 1.0496,
209
+ 2.7979,
210
+ 2.0111,
211
+ 3.2578,
212
+ 1.1755,
213
+ 1.4229,
214
+ 4.5469,
215
+ 1.0312,
216
+ 1.0638,
217
+ 2.2574,
218
+ 1.4536,
219
+ 2.3245,
220
+ 3.8574,
221
+ 0.665,
222
+ 0.6479,
223
+ 3.3828,
224
+ 2.3435,
225
+ 1.0186,
226
+ 0.6663,
227
+ 0.9571,
228
+ 1.7324,
229
+ 1.4941,
230
+ 1.5548,
231
+ 2.4475,
232
+ 0.9738,
233
+ 1.2276,
234
+ 2.8808,
235
+ 0.9923,
236
+ 1.0263,
237
+ 0.5958,
238
+ 1.4596,
239
+ 4.775,
240
+ 1.7246,
241
+ 2.4754,
242
+ 2.1957,
243
+ 0.6558,
244
+ 1.402,
245
+ 1.202,
246
+ 4.1727,
247
+ 3.1152,
248
+ 1.1338,
249
+ 1.0413,
250
+ 0.6425,
251
+ 2.2472,
252
+ 1.2499,
253
+ 1.6737,
254
+ 1.0656,
255
+ 1.3808,
256
+ 0.6704,
257
+ 0.8631,
258
+ 2.9209,
259
+ 3.0871,
260
+ 1.629,
261
+ 1.012
262
+ ],
263
+ "lr": 0.0002
264
+ }
265
+ }