opt-2.7b-int4-SS-F / quant_log.csv
iproskurina's picture
Add files using upload-large-folder tool
150bdd2 verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.00394990,0.01000,1.281
0,self_attn.v_proj,0.00102141,0.01000,1.273
0,self_attn.q_proj,0.00392392,0.01000,1.275
0,self_attn.out_proj,0.00003452,0.01000,1.292
0,fc1,0.01215448,0.01000,1.291
0,fc2,0.00012052,0.01000,5.352
1,self_attn.k_proj,0.01467542,0.01000,1.241
1,self_attn.v_proj,0.00038407,0.01000,1.264
1,self_attn.q_proj,0.00410239,0.01000,1.281
1,self_attn.out_proj,0.00000663,0.01000,1.252
1,fc1,0.00909016,0.01000,1.273
1,fc2,0.00009310,0.01000,5.235
2,self_attn.k_proj,0.01546464,0.01000,1.281
2,self_attn.v_proj,0.00049482,0.01000,1.238
2,self_attn.q_proj,0.00585759,0.01000,1.243
2,self_attn.out_proj,0.00000087,0.01000,1.237
2,fc1,0.00996129,0.01000,1.262
2,fc2,0.00008796,0.01000,5.313
3,self_attn.k_proj,0.00665643,0.01000,1.236
3,self_attn.v_proj,0.00061016,0.01000,1.249
3,self_attn.q_proj,0.00416894,0.01000,1.287
3,self_attn.out_proj,0.00000125,0.01000,1.231
3,fc1,0.00974267,0.01000,1.294
3,fc2,0.00008339,0.01000,5.251
4,self_attn.k_proj,0.00921630,0.01000,1.243
4,self_attn.v_proj,0.00083335,0.01000,1.250
4,self_attn.q_proj,0.00537768,0.01000,1.279
4,self_attn.out_proj,0.00000241,0.01000,1.244
4,fc1,0.00916280,0.01000,1.286
4,fc2,0.00009056,0.01000,5.330
5,self_attn.k_proj,0.00837081,0.01000,1.257
5,self_attn.v_proj,0.00097881,0.01000,1.252
5,self_attn.q_proj,0.00573123,0.01000,1.255
5,self_attn.out_proj,0.00000650,0.01000,1.254
5,fc1,0.01018309,0.01000,1.269
5,fc2,0.00009399,0.01000,5.325
6,self_attn.k_proj,0.00624802,0.01000,1.236
6,self_attn.v_proj,0.00120398,0.01000,1.253
6,self_attn.q_proj,0.00635306,0.01000,1.268
6,self_attn.out_proj,0.00000861,0.01000,1.251
6,fc1,0.01157868,0.01000,1.280
6,fc2,0.00011119,0.01000,5.292
7,self_attn.k_proj,0.00673938,0.01000,1.269
7,self_attn.v_proj,0.00140799,0.01000,1.324
7,self_attn.q_proj,0.00758268,0.01000,1.260
7,self_attn.out_proj,0.00001078,0.01000,1.265
7,fc1,0.01286504,0.01000,1.262
7,fc2,0.00011152,0.01000,5.347
8,self_attn.k_proj,0.01198061,0.01000,1.231
8,self_attn.v_proj,0.00181584,0.01000,1.246
8,self_attn.q_proj,0.00865953,0.01000,1.271
8,self_attn.out_proj,0.00001939,0.01000,1.240
8,fc1,0.01473213,0.01000,1.249
8,fc2,0.00013096,0.01000,5.281
9,self_attn.k_proj,0.01012673,0.01000,1.239
9,self_attn.v_proj,0.00216779,0.01000,1.252
9,self_attn.q_proj,0.00914032,0.01000,1.257
9,self_attn.out_proj,0.00002055,0.01000,1.243
9,fc1,0.01706153,0.01000,1.261
9,fc2,0.00015577,0.01000,5.270
10,self_attn.k_proj,0.01118829,0.01000,1.285
10,self_attn.v_proj,0.00250398,0.01000,1.257
10,self_attn.q_proj,0.01054306,0.01000,1.280
10,self_attn.out_proj,0.00003266,0.01000,1.242
10,fc1,0.02150265,0.01000,1.281
10,fc2,0.00022845,0.01000,5.320
11,self_attn.k_proj,0.01217411,0.01000,1.240
11,self_attn.v_proj,0.00297503,0.01000,1.237
11,self_attn.q_proj,0.01163996,0.01000,1.261
11,self_attn.out_proj,0.00003680,0.01000,1.256
11,fc1,0.02571280,0.01000,1.285
11,fc2,0.00023919,0.01000,5.303
12,self_attn.k_proj,0.01357361,0.01000,1.248
12,self_attn.v_proj,0.00355875,0.01000,1.231
12,self_attn.q_proj,0.01265827,0.01000,1.275
12,self_attn.out_proj,0.00004796,0.01000,1.244
12,fc1,0.03000994,0.01000,1.269
12,fc2,0.00029458,0.01000,5.289
13,self_attn.k_proj,0.01616533,0.01000,1.249
13,self_attn.v_proj,0.00403290,0.01000,1.255
13,self_attn.q_proj,0.01485024,0.01000,1.244
13,self_attn.out_proj,0.00008728,0.01000,1.243
13,fc1,0.03540917,0.01000,1.286
13,fc2,0.00037594,0.01000,5.299
14,self_attn.k_proj,0.01755567,0.01000,1.273
14,self_attn.v_proj,0.00486799,0.01000,1.248
14,self_attn.q_proj,0.01594050,0.01000,1.274
14,self_attn.out_proj,0.00009562,0.01000,1.223
14,fc1,0.04057390,0.01000,1.283
14,fc2,0.00049239,0.01000,5.391
15,self_attn.k_proj,0.02163056,0.01000,1.265
15,self_attn.v_proj,0.00555094,0.01000,1.258
15,self_attn.q_proj,0.01904528,0.01000,1.258
15,self_attn.out_proj,0.00018198,0.01000,1.247
15,fc1,0.04487120,0.01000,1.278
15,fc2,0.00063424,0.01000,5.313
16,self_attn.k_proj,0.02287876,0.01000,1.273
16,self_attn.v_proj,0.00654785,0.01000,1.244
16,self_attn.q_proj,0.01999130,0.01000,1.257
16,self_attn.out_proj,0.00021466,0.01000,1.263
16,fc1,0.04983628,0.01000,1.271
16,fc2,0.00108457,0.01000,5.294
17,self_attn.k_proj,0.02326965,0.01000,1.276
17,self_attn.v_proj,0.00799770,0.01000,1.247
17,self_attn.q_proj,0.01995130,0.01000,1.271
17,self_attn.out_proj,0.00025417,0.01000,1.309
17,fc1,0.05527238,0.01000,1.273
17,fc2,0.00139859,0.01000,5.297
18,self_attn.k_proj,0.02433346,0.01000,1.252
18,self_attn.v_proj,0.00959834,0.01000,1.235
18,self_attn.q_proj,0.02166979,0.01000,1.241
18,self_attn.out_proj,0.00027066,0.01000,1.227
18,fc1,0.06184222,0.01000,1.286
18,fc2,0.00186334,0.01000,5.241
19,self_attn.k_proj,0.02368311,0.01000,1.249
19,self_attn.v_proj,0.01161100,0.01000,1.237
19,self_attn.q_proj,0.01947075,0.01000,1.247
19,self_attn.out_proj,0.00037949,0.01000,1.253
19,fc1,0.07012071,0.01000,1.283
19,fc2,0.00237346,0.01000,5.274
20,self_attn.k_proj,0.02460291,0.01000,1.267
20,self_attn.v_proj,0.01390896,0.01000,1.280
20,self_attn.q_proj,0.02117208,0.01000,1.262
20,self_attn.out_proj,0.00036344,0.01000,1.269
20,fc1,0.07792345,0.01000,1.291
20,fc2,0.00293787,0.01000,5.260
21,self_attn.k_proj,0.02349118,0.01000,1.253
21,self_attn.v_proj,0.01582944,0.01000,1.245
21,self_attn.q_proj,0.02149881,0.01000,1.270
21,self_attn.out_proj,0.00039286,0.01000,1.250
21,fc1,0.08261187,0.01000,1.267
21,fc2,0.00354288,0.01000,5.303
22,self_attn.k_proj,0.02509292,0.01000,1.271
22,self_attn.v_proj,0.01692703,0.01000,1.250
22,self_attn.q_proj,0.02045271,0.01000,1.255
22,self_attn.out_proj,0.00058325,0.01000,1.254
22,fc1,0.09038876,0.01000,1.282
22,fc2,0.00433740,0.01000,5.283
23,self_attn.k_proj,0.02301701,0.01000,1.267
23,self_attn.v_proj,0.01848015,0.01000,1.240
23,self_attn.q_proj,0.02106069,0.01000,1.249
23,self_attn.out_proj,0.00045746,0.01000,1.267
23,fc1,0.09600659,0.01000,1.304
23,fc2,0.00485786,0.01000,5.352
24,self_attn.k_proj,0.02274082,0.01000,1.270
24,self_attn.v_proj,0.02127173,0.01000,1.272
24,self_attn.q_proj,0.02076919,0.01000,1.274
24,self_attn.out_proj,0.00078850,0.01000,1.243
24,fc1,0.10268364,0.01000,1.260
24,fc2,0.00595228,0.01000,5.299
25,self_attn.k_proj,0.02236036,0.01000,1.251
25,self_attn.v_proj,0.02580946,0.01000,1.248
25,self_attn.q_proj,0.02157809,0.01000,1.273
25,self_attn.out_proj,0.00091601,0.01000,1.259
25,fc1,0.10824930,0.01000,1.278
25,fc2,0.00661862,0.01000,5.325
26,self_attn.k_proj,0.02290183,0.01000,1.270
26,self_attn.v_proj,0.02645369,0.01000,1.247
26,self_attn.q_proj,0.02129553,0.01000,1.260
26,self_attn.out_proj,0.00105756,0.01000,1.288
26,fc1,0.11557976,0.01000,1.267
26,fc2,0.00827897,0.01000,5.285
27,self_attn.k_proj,0.02248514,0.01000,1.253
27,self_attn.v_proj,0.02992377,0.01000,1.254
27,self_attn.q_proj,0.02264811,0.01000,1.245
27,self_attn.out_proj,0.00074538,0.01000,1.261
27,fc1,0.11797357,0.01000,1.286
27,fc2,0.00943409,0.01000,5.300
28,self_attn.k_proj,0.02341844,0.01000,1.267
28,self_attn.v_proj,0.03110846,0.01000,1.236
28,self_attn.q_proj,0.02293959,0.01000,1.241
28,self_attn.out_proj,0.00141534,0.01000,1.255
28,fc1,0.12168028,0.01000,1.268
28,fc2,0.01113645,0.01000,5.277
29,self_attn.k_proj,0.02414644,0.01000,1.235
29,self_attn.v_proj,0.03360369,0.01000,1.268
29,self_attn.q_proj,0.02726843,0.01000,1.276
29,self_attn.out_proj,0.00087671,0.01000,1.250
29,fc1,0.11952688,0.01000,1.281
29,fc2,0.01210173,0.01000,5.320
30,self_attn.k_proj,0.02478706,0.01000,1.243
30,self_attn.v_proj,0.03503960,0.01000,1.243
30,self_attn.q_proj,0.02936129,0.01000,1.239
30,self_attn.out_proj,0.00060751,0.01000,1.268
30,fc1,0.11692072,0.01000,1.263
30,fc2,0.01395721,0.01000,5.274
31,self_attn.k_proj,0.02395790,0.01000,1.259
31,self_attn.v_proj,0.03193032,0.01000,1.255
31,self_attn.q_proj,0.03179608,0.01000,1.267
31,self_attn.out_proj,0.00154203,0.01000,1.242
31,fc1,0.10718785,0.01000,1.273
31,fc2,0.00861030,0.01000,5.303