diff --git "a/quantization_index.json" "b/quantization_index.json" new file mode 100644--- /dev/null +++ "b/quantization_index.json" @@ -0,0 +1,92567 @@ +{ + "model_id": "zai-org/GLM-4.7-Flash", + "quantization": { + "method": "trellis_cuda", + "min_bits": 2, + "max_bits": 8, + "group_size": 128, + "effective_bits": 3.7848377517799006 + }, + "statistics": { + "total_tensors": 9254, + "successful": 9254, + "failed": 0, + "total_params": 29308747776, + "avg_mse": 0.0002232240694604069, + "total_time_sec": 110.36988474000009, + "bit_distribution": { + "2b": 2736, + "3b": 2710, + "4b": 575, + "5b": 196, + "6b": 3037 + } + }, + "layers": [ + { + "name": "model.layers.0.mlp.down_proj.weight", + "shape": [ + 2048, + 10240 + ], + "bits": 5, + "mse": 3.0065662031120155e-06, + "sensitivity": 2.0979309245857647 + }, + { + "name": "model.layers.0.mlp.gate_proj.weight", + "shape": [ + 10240, + 2048 + ], + "bits": 6, + "mse": 8.390748007514048e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.0.mlp.up_proj.weight", + "shape": [ + 10240, + 2048 + ], + "bits": 3, + "mse": 7.702448056079447e-05, + "sensitivity": 1.153642657995318 + }, + { + "name": "model.layers.0.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 5.357392637961311e-06, + "sensitivity": 2.1543192625786647 + }, + { + "name": "model.layers.0.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 5, + "mse": 7.915920832601842e-06, + "sensitivity": 2.2066540899914355 + }, + { + "name": "model.layers.0.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 4.408653239806881e-06, + "sensitivity": 1.9473644949828508 + }, + { + "name": "model.layers.0.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 2.355716424062848e-05, + "sensitivity": 0.9940753678023229 + }, + { + "name": "model.layers.0.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 5, + "mse": 9.121675248024985e-06, + "sensitivity": 2.180818978882941 + }, + { + "name": "model.layers.1.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.945580414845608e-05, + "sensitivity": 1.05633246261043 + }, + { + "name": "model.layers.1.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.088716304475383e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000706042570527643, + "sensitivity": 0.5329304776870476 + }, + { + "name": "model.layers.1.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8707199059426785e-05, + "sensitivity": 1.1509562616551563 + }, + { + "name": "model.layers.1.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.304556106646487e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.94214686518535e-05, + "sensitivity": 0.7511464235585992 + }, + { + "name": "model.layers.1.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.208647391758859e-05, + "sensitivity": 0.9750583685936092 + }, + { + "name": "model.layers.1.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.202154168022389e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007012628484517336, + "sensitivity": 0.5736765453445599 + }, + { + "name": "model.layers.1.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.852015965501778e-05, + "sensitivity": 0.6750553503787329 + }, + { + "name": "model.layers.1.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.074311045267677e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007069016573950648, + "sensitivity": 0.5116522315040535 + }, + { + "name": "model.layers.1.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.1475853979354724e-05, + "sensitivity": 1.0840733054978677 + }, + { + "name": "model.layers.1.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.388847057474777e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5915821576491e-05, + "sensitivity": 0.9136558228696315 + }, + { + "name": "model.layers.1.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.772859731223434e-05, + "sensitivity": 0.7332689229887623 + }, + { + "name": "model.layers.1.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.858658482793544e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006789648323319852, + "sensitivity": 0.5273672147108106 + }, + { + "name": "model.layers.1.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.021194712957367e-05, + "sensitivity": 0.9322568931511268 + }, + { + "name": "model.layers.1.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.647094323852798e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007528256392106414, + "sensitivity": 0.5464896467410008 + }, + { + "name": "model.layers.1.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9081932704430073e-05, + "sensitivity": 0.6288406834657645 + }, + { + "name": "model.layers.1.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.231706493053935e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007251184433698654, + "sensitivity": 0.5298342810057413 + }, + { + "name": "model.layers.1.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006876597180962563, + "sensitivity": 0.5478110312226175 + }, + { + "name": "model.layers.1.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.369790526150609e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007398161105811596, + "sensitivity": 0.542743823874873 + }, + { + "name": "model.layers.1.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006861464935354888, + "sensitivity": 0.556595269158572 + }, + { + "name": "model.layers.1.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.273803023759683e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007265096064656973, + "sensitivity": 0.5431470246513287 + }, + { + "name": "model.layers.1.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.926963684847578e-06, + "sensitivity": 1.5297450242053912 + }, + { + "name": "model.layers.1.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.700816245735041e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.883780977455899e-05, + "sensitivity": 0.6514522296068361 + }, + { + "name": "model.layers.1.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.366184970829636e-05, + "sensitivity": 0.7059876012078068 + }, + { + "name": "model.layers.1.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.651163175774855e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007717191474512219, + "sensitivity": 0.5432075135849723 + }, + { + "name": "model.layers.1.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6457949540345e-05, + "sensitivity": 0.6700653032618367 + }, + { + "name": "model.layers.1.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.894651167182019e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006909866351634264, + "sensitivity": 0.5315274682237326 + }, + { + "name": "model.layers.1.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.778695049230009e-05, + "sensitivity": 0.6743638645954556 + }, + { + "name": "model.layers.1.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.989932105876505e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.222042429726571e-05, + "sensitivity": 0.6076999462716999 + }, + { + "name": "model.layers.1.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.088727241149172e-05, + "sensitivity": 0.9293144556174866 + }, + { + "name": "model.layers.1.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.083968054961588e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.57602577120997e-05, + "sensitivity": 0.6125585061286023 + }, + { + "name": "model.layers.1.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8775298384716734e-05, + "sensitivity": 0.6269297842135456 + }, + { + "name": "model.layers.1.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.936102181498427e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007491018623113632, + "sensitivity": 0.5717816080186022 + }, + { + "name": "model.layers.1.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.712389247491956e-05, + "sensitivity": 0.6017964557839103 + }, + { + "name": "model.layers.1.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.992279739075457e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006939051672816277, + "sensitivity": 0.5351029455097621 + }, + { + "name": "model.layers.1.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0345183909521438e-05, + "sensitivity": 1.2175160671256555 + }, + { + "name": "model.layers.1.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.800407052447554e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006646983092650771, + "sensitivity": 0.5437498645340249 + }, + { + "name": "model.layers.1.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0325789844500832e-05, + "sensitivity": 1.602549990546906 + }, + { + "name": "model.layers.1.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.76636580262857e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006699999212287366, + "sensitivity": 0.5617565518374802 + }, + { + "name": "model.layers.1.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.663551200996153e-05, + "sensitivity": 0.8011861740161235 + }, + { + "name": "model.layers.1.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.255478410821524e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.39556092210114e-05, + "sensitivity": 0.8260173891625407 + }, + { + "name": "model.layers.1.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.867027721251361e-05, + "sensitivity": 0.839696167916931 + }, + { + "name": "model.layers.1.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.474218707808177e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007384248310700059, + "sensitivity": 0.5318172552201543 + }, + { + "name": "model.layers.1.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 7.762881068629213e-06, + "sensitivity": 1.3919723737977423 + }, + { + "name": "model.layers.1.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.743935045960825e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.287332507781684e-05, + "sensitivity": 0.6382699162946295 + }, + { + "name": "model.layers.1.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0072743508499116e-05, + "sensitivity": 0.6848972557441011 + }, + { + "name": "model.layers.1.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.227509175005252e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007216193480417132, + "sensitivity": 0.5585915304281914 + }, + { + "name": "model.layers.1.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.212219886947423e-05, + "sensitivity": 0.6404290906497698 + }, + { + "name": "model.layers.1.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.451672334151226e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007516718469560146, + "sensitivity": 0.5154440675940664 + }, + { + "name": "model.layers.1.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006734145572409034, + "sensitivity": 0.5789922620595601 + }, + { + "name": "model.layers.1.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.244005135158659e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007194909267127514, + "sensitivity": 0.506542767829843 + }, + { + "name": "model.layers.1.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.710440382244997e-05, + "sensitivity": 0.7785803883817267 + }, + { + "name": "model.layers.1.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.073648819437949e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006898684659972787, + "sensitivity": 0.5033169345189182 + }, + { + "name": "model.layers.1.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.526108361664228e-05, + "sensitivity": 0.8204644621674357 + }, + { + "name": "model.layers.1.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.831716407556087e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006732492474839091, + "sensitivity": 0.5535000565800609 + }, + { + "name": "model.layers.1.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.136714364401996e-05, + "sensitivity": 1.062624637754448 + }, + { + "name": "model.layers.1.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.516017947433284e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007479293271899223, + "sensitivity": 0.5805955468164434 + }, + { + "name": "model.layers.1.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6859156757127494e-05, + "sensitivity": 0.6684237266059603 + }, + { + "name": "model.layers.1.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.885818836759427e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006734858034178615, + "sensitivity": 0.5321618340896571 + }, + { + "name": "model.layers.1.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.288357351673767e-05, + "sensitivity": 0.9988061100013048 + }, + { + "name": "model.layers.1.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.394538220571121e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006305475253611803, + "sensitivity": 0.5114646678925123 + }, + { + "name": "model.layers.1.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.948065881966613e-05, + "sensitivity": 0.871043374315495 + }, + { + "name": "model.layers.1.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.139675861049909e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007124726544134319, + "sensitivity": 0.5409620875025165 + }, + { + "name": "model.layers.1.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.167671381263062e-05, + "sensitivity": 0.9436389842736912 + }, + { + "name": "model.layers.1.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.399570793291787e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007443134090863168, + "sensitivity": 0.5187434612131631 + }, + { + "name": "model.layers.1.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.017141276970506e-05, + "sensitivity": 0.7414642847630519 + }, + { + "name": "model.layers.1.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.187839289850672e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007151130121201277, + "sensitivity": 0.5954510689508186 + }, + { + "name": "model.layers.1.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007028746185824275, + "sensitivity": 0.5657199560715326 + }, + { + "name": "model.layers.1.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.586002427866333e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007675624219700694, + "sensitivity": 0.5063895863360861 + }, + { + "name": "model.layers.1.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.203779048519209e-05, + "sensitivity": 0.7285713972900425 + }, + { + "name": "model.layers.1.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.577242857019883e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007657792302779853, + "sensitivity": 0.5350005813599398 + }, + { + "name": "model.layers.1.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.045118789188564e-05, + "sensitivity": 0.6051168168531535 + }, + { + "name": "model.layers.1.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.327325081656454e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007333098910748959, + "sensitivity": 0.5718397820387567 + }, + { + "name": "model.layers.1.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006814757362008095, + "sensitivity": 0.5902750491594287 + }, + { + "name": "model.layers.1.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.376571946020704e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007336141425184906, + "sensitivity": 0.5272879368864146 + }, + { + "name": "model.layers.1.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0309031495125964e-05, + "sensitivity": 1.2275653482163982 + }, + { + "name": "model.layers.1.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.168316074057657e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.058573490008712e-05, + "sensitivity": 0.8601511940648492 + }, + { + "name": "model.layers.1.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8852114307228476e-05, + "sensitivity": 0.7027394093461021 + }, + { + "name": "model.layers.1.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.216733936525998e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007218911778181791, + "sensitivity": 0.5486119794567152 + }, + { + "name": "model.layers.1.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.813718235003762e-05, + "sensitivity": 0.604454106817387 + }, + { + "name": "model.layers.1.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.174225291033508e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007113752653822303, + "sensitivity": 0.5178570242603164 + }, + { + "name": "model.layers.1.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.241572555154562e-05, + "sensitivity": 0.6704578479346931 + }, + { + "name": "model.layers.1.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.485859103122493e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007571444730274379, + "sensitivity": 0.5161457909887365 + }, + { + "name": "model.layers.1.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9612852055579424e-05, + "sensitivity": 0.6918091462587476 + }, + { + "name": "model.layers.1.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.636150260419527e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007355489651672542, + "sensitivity": 0.5288312287818265 + }, + { + "name": "model.layers.1.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.993898957967758e-05, + "sensitivity": 0.6608220765217772 + }, + { + "name": "model.layers.1.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.3513436998619e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007413762505166233, + "sensitivity": 0.5230738295211257 + }, + { + "name": "model.layers.1.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.126197695266455e-05, + "sensitivity": 0.697775647531875 + }, + { + "name": "model.layers.1.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.526100833070814e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007590969908051193, + "sensitivity": 0.5675856909411058 + }, + { + "name": "model.layers.1.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0119404224678874e-05, + "sensitivity": 0.7838928925372811 + }, + { + "name": "model.layers.1.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.316608391898626e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007315666298381984, + "sensitivity": 0.573187165551579 + }, + { + "name": "model.layers.1.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5940356105566025e-05, + "sensitivity": 1.1232700925487693 + }, + { + "name": "model.layers.1.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.744641384808347e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006764165009371936, + "sensitivity": 0.515544866960908 + }, + { + "name": "model.layers.1.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.92915021115914e-05, + "sensitivity": 0.7217744705244168 + }, + { + "name": "model.layers.1.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.196989374984696e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007202638080343604, + "sensitivity": 0.5630791192958148 + }, + { + "name": "model.layers.1.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.810360744362697e-05, + "sensitivity": 0.952676883384989 + }, + { + "name": "model.layers.1.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.229907967281179e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007110365550033748, + "sensitivity": 0.5695350375952825 + }, + { + "name": "model.layers.1.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.003324961056933e-05, + "sensitivity": 0.8604997117090291 + }, + { + "name": "model.layers.1.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.221384865057189e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007243648869916797, + "sensitivity": 0.5045773072470656 + }, + { + "name": "model.layers.1.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.751938705448993e-06, + "sensitivity": 1.3835859698943191 + }, + { + "name": "model.layers.1.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.506403795152437e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006411081412807107, + "sensitivity": 0.5951880384716677 + }, + { + "name": "model.layers.1.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006655186880379915, + "sensitivity": 0.5347733054740964 + }, + { + "name": "model.layers.1.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.547451221194933e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007549802539870143, + "sensitivity": 0.5582450191679067 + }, + { + "name": "model.layers.1.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006968966918066144, + "sensitivity": 0.5596353657531932 + }, + { + "name": "model.layers.1.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.712450044688012e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007804572815075517, + "sensitivity": 0.5130251498411098 + }, + { + "name": "model.layers.1.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9856451116502285e-05, + "sensitivity": 0.726034216473246 + }, + { + "name": "model.layers.1.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.285960694185633e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007261476712301373, + "sensitivity": 0.5328406724804157 + }, + { + "name": "model.layers.1.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.902646080357954e-05, + "sensitivity": 0.6541645299090524 + }, + { + "name": "model.layers.1.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.98717349475919e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006953920237720013, + "sensitivity": 0.545202173251164 + }, + { + "name": "model.layers.1.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5473643442383036e-05, + "sensitivity": 0.8567062361254867 + }, + { + "name": "model.layers.1.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.672268343914766e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006545383366756141, + "sensitivity": 0.5524932342585303 + }, + { + "name": "model.layers.1.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.105279317125678e-05, + "sensitivity": 0.7402823940228639 + }, + { + "name": "model.layers.1.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.898332571836363e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007377161527983844, + "sensitivity": 0.5198659536876988 + }, + { + "name": "model.layers.1.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8163044741377234e-05, + "sensitivity": 0.7491417479602756 + }, + { + "name": "model.layers.1.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.228904112504097e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007213937933556736, + "sensitivity": 0.5734752383745237 + }, + { + "name": "model.layers.1.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9510344726732e-05, + "sensitivity": 0.7350354381221457 + }, + { + "name": "model.layers.1.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.305651822913205e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007306559709832072, + "sensitivity": 0.5082377979504902 + }, + { + "name": "model.layers.1.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006715766503475606, + "sensitivity": 0.5398906733224176 + }, + { + "name": "model.layers.1.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.236691660888027e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007296734838746488, + "sensitivity": 0.49871185329574025 + }, + { + "name": "model.layers.1.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.046460475772619e-05, + "sensitivity": 0.6475521480563887 + }, + { + "name": "model.layers.1.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.318912255665055e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007349549559876323, + "sensitivity": 0.5512153371439551 + }, + { + "name": "model.layers.1.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7738448958843946e-05, + "sensitivity": 0.8059062142705675 + }, + { + "name": "model.layers.1.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.254175559661235e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.327655137283728e-05, + "sensitivity": 0.6188513324400853 + }, + { + "name": "model.layers.1.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0171381291002035e-05, + "sensitivity": 1.4806646686297573 + }, + { + "name": "model.layers.1.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.4057363740867e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5805685406085104e-05, + "sensitivity": 0.8186139180290579 + }, + { + "name": "model.layers.1.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.053488323232159e-05, + "sensitivity": 0.6792806663932732 + }, + { + "name": "model.layers.1.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.314900247161859e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007333712419494987, + "sensitivity": 0.4972852873368069 + }, + { + "name": "model.layers.1.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006558268214575946, + "sensitivity": 0.5736437222639301 + }, + { + "name": "model.layers.1.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.132133307801269e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.312305049505085e-05, + "sensitivity": 0.6402156256978115 + }, + { + "name": "model.layers.1.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.2993936252314597e-05, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.5860648545640288e-06, + "sensitivity": 2.097979164114025 + }, + { + "name": "model.layers.1.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.960584748114343e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.1.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 6.908195700816577e-06, + "sensitivity": 1.7474623316197488 + }, + { + "name": "model.layers.1.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 5.859585144207813e-06, + "sensitivity": 2.1343460618200747 + }, + { + "name": "model.layers.1.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 4, + "mse": 4.448661638889462e-05, + "sensitivity": 1.2595580437578628 + }, + { + "name": "model.layers.1.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 9.338111340184696e-06, + "sensitivity": 1.5287555831986808 + }, + { + "name": "model.layers.1.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 3.1847102945903316e-05, + "sensitivity": 0.8137678952447148 + }, + { + "name": "model.layers.1.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 4, + "mse": 6.655816832790151e-05, + "sensitivity": 1.4344571446740946 + }, + { + "name": "model.layers.2.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.788936323369853e-05, + "sensitivity": 0.637117571081665 + }, + { + "name": "model.layers.2.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.92528749621124e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006853381637483835, + "sensitivity": 0.5292625168620071 + }, + { + "name": "model.layers.2.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006603162037208676, + "sensitivity": 0.5099343843315627 + }, + { + "name": "model.layers.2.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.916039071962587e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006885470356792212, + "sensitivity": 0.5383619701065838 + }, + { + "name": "model.layers.2.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8043071476276964e-05, + "sensitivity": 0.7901511208644407 + }, + { + "name": "model.layers.2.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.425913170460262e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.483458128059283e-05, + "sensitivity": 0.6151559787240425 + }, + { + "name": "model.layers.2.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006500632152892649, + "sensitivity": 0.5224479702307299 + }, + { + "name": "model.layers.2.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.864437753189122e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006800758419558406, + "sensitivity": 0.516434915779298 + }, + { + "name": "model.layers.2.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006621964275836945, + "sensitivity": 0.5357516082936662 + }, + { + "name": "model.layers.2.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.296368155744858e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007026169914752245, + "sensitivity": 0.5020391801268185 + }, + { + "name": "model.layers.2.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006564076757058501, + "sensitivity": 0.5291995930497548 + }, + { + "name": "model.layers.2.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.847191459906753e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006729754386469722, + "sensitivity": 0.5494191738948431 + }, + { + "name": "model.layers.2.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006531747058033943, + "sensitivity": 0.5424451453172494 + }, + { + "name": "model.layers.2.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.043167104508029e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006917932769283652, + "sensitivity": 0.5175586013374985 + }, + { + "name": "model.layers.2.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.855287236045115e-05, + "sensitivity": 0.6272529683970446 + }, + { + "name": "model.layers.2.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.18402964391862e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007024051155894995, + "sensitivity": 0.5300315797519255 + }, + { + "name": "model.layers.2.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006588708492927253, + "sensitivity": 0.5876723057827589 + }, + { + "name": "model.layers.2.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.969351377643761e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006939381128177047, + "sensitivity": 0.5733248891278955 + }, + { + "name": "model.layers.2.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006776638329029083, + "sensitivity": 0.5271574989151324 + }, + { + "name": "model.layers.2.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.140612072158547e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007107902783900499, + "sensitivity": 0.5559366843677089 + }, + { + "name": "model.layers.2.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006497822469100356, + "sensitivity": 0.5294735033525237 + }, + { + "name": "model.layers.2.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.832420129081584e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006744188140146434, + "sensitivity": 0.5231441727437001 + }, + { + "name": "model.layers.2.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000665354251395911, + "sensitivity": 0.5321946901335889 + }, + { + "name": "model.layers.2.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.975477961328579e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006952101830393076, + "sensitivity": 0.5259397434370704 + }, + { + "name": "model.layers.2.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006540108006447554, + "sensitivity": 0.5048513525104465 + }, + { + "name": "model.layers.2.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.81134486310475e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006742709083482623, + "sensitivity": 0.5262978148800059 + }, + { + "name": "model.layers.2.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.863839032826945e-05, + "sensitivity": 0.6703715924798028 + }, + { + "name": "model.layers.2.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.938485969636531e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000688089698087424, + "sensitivity": 0.5200938695271349 + }, + { + "name": "model.layers.2.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8586061641108245e-05, + "sensitivity": 0.9237234380209465 + }, + { + "name": "model.layers.2.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.031565931152727e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006988599780015647, + "sensitivity": 0.5532940274008371 + }, + { + "name": "model.layers.2.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006515826098620892, + "sensitivity": 0.5492346116743078 + }, + { + "name": "model.layers.2.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.846945327903086e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006772064371034503, + "sensitivity": 0.5522856518020094 + }, + { + "name": "model.layers.2.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006531979888677597, + "sensitivity": 0.5250952719843 + }, + { + "name": "model.layers.2.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.833566092405817e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006774617359042168, + "sensitivity": 0.5260844666104033 + }, + { + "name": "model.layers.2.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006502066971734166, + "sensitivity": 0.5359265831620937 + }, + { + "name": "model.layers.2.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.845467399012705e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006737875519320369, + "sensitivity": 0.5227271346167179 + }, + { + "name": "model.layers.2.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006600776687264442, + "sensitivity": 0.5137320249233672 + }, + { + "name": "model.layers.2.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.987889721836837e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006912198732607067, + "sensitivity": 0.5659112750063078 + }, + { + "name": "model.layers.2.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.844603219884448e-05, + "sensitivity": 0.6100404991673078 + }, + { + "name": "model.layers.2.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.019632792231278e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006926943315193057, + "sensitivity": 0.5473455438023518 + }, + { + "name": "model.layers.2.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000651102396659553, + "sensitivity": 0.5695221530731435 + }, + { + "name": "model.layers.2.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.804732836622861e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006717864307574928, + "sensitivity": 0.5350351552582775 + }, + { + "name": "model.layers.2.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006406318861991167, + "sensitivity": 0.5390368199438017 + }, + { + "name": "model.layers.2.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.79091363306361e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006692288443446159, + "sensitivity": 0.5303933995388403 + }, + { + "name": "model.layers.2.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006477210554294288, + "sensitivity": 0.5504735892614155 + }, + { + "name": "model.layers.2.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.817384476358711e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006730208988301456, + "sensitivity": 0.5196833422682965 + }, + { + "name": "model.layers.2.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006742124678567052, + "sensitivity": 0.5890436954584746 + }, + { + "name": "model.layers.2.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.398703931154159e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00072105647996068, + "sensitivity": 0.5350870112633378 + }, + { + "name": "model.layers.2.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006554084829986095, + "sensitivity": 0.53524745271771 + }, + { + "name": "model.layers.2.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.917395355936605e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006829767371527851, + "sensitivity": 0.5303733738212072 + }, + { + "name": "model.layers.2.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006702264654450119, + "sensitivity": 0.5242864592397053 + }, + { + "name": "model.layers.2.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.053537617844995e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007012556307017803, + "sensitivity": 0.5208583382292724 + }, + { + "name": "model.layers.2.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006572377751581371, + "sensitivity": 0.5776043202321025 + }, + { + "name": "model.layers.2.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.938422873441596e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006880320142954588, + "sensitivity": 0.5631608039445111 + }, + { + "name": "model.layers.2.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006652208976447582, + "sensitivity": 0.5643857546298421 + }, + { + "name": "model.layers.2.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.969920380266558e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006962899933569133, + "sensitivity": 0.5277075076174838 + }, + { + "name": "model.layers.2.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.919697287026793e-05, + "sensitivity": 0.8645927415528301 + }, + { + "name": "model.layers.2.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.332454063340265e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007268571644090116, + "sensitivity": 0.5893619816314745 + }, + { + "name": "model.layers.2.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000657309778034687, + "sensitivity": 0.5276774531742341 + }, + { + "name": "model.layers.2.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.948190846538637e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006853543454781175, + "sensitivity": 0.5117859684057103 + }, + { + "name": "model.layers.2.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.995994069962762e-05, + "sensitivity": 0.6999846551822053 + }, + { + "name": "model.layers.2.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.337795070976426e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007308036438189447, + "sensitivity": 0.5384432380359576 + }, + { + "name": "model.layers.2.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006623267545364797, + "sensitivity": 0.5345988614047849 + }, + { + "name": "model.layers.2.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.923203616475803e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006884669419378042, + "sensitivity": 0.5344720642256285 + }, + { + "name": "model.layers.2.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006558216991834342, + "sensitivity": 0.5552878261669154 + }, + { + "name": "model.layers.2.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.95667984271131e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006911600357852876, + "sensitivity": 0.558485497951545 + }, + { + "name": "model.layers.2.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006603606743738055, + "sensitivity": 0.5191522454533072 + }, + { + "name": "model.layers.2.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.887392262593494e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006860473076812923, + "sensitivity": 0.5182085053663555 + }, + { + "name": "model.layers.2.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006595769664272666, + "sensitivity": 0.5387287782824223 + }, + { + "name": "model.layers.2.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.975117574053002e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006852728547528386, + "sensitivity": 0.5401791905081401 + }, + { + "name": "model.layers.2.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006616559694521129, + "sensitivity": 0.5502344849506853 + }, + { + "name": "model.layers.2.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.168349955260055e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007121736416593194, + "sensitivity": 0.5257197859244577 + }, + { + "name": "model.layers.2.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006602990324608982, + "sensitivity": 0.5352175636436438 + }, + { + "name": "model.layers.2.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.072373253118712e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006975110154598951, + "sensitivity": 0.5253953036227406 + }, + { + "name": "model.layers.2.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.847254578839056e-05, + "sensitivity": 0.6744290943302863 + }, + { + "name": "model.layers.2.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.976164629828418e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006898273131810129, + "sensitivity": 0.5131317138379279 + }, + { + "name": "model.layers.2.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006443810416385531, + "sensitivity": 0.5364398600027781 + }, + { + "name": "model.layers.2.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.75344472508732e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00066965795122087, + "sensitivity": 0.5287747142843991 + }, + { + "name": "model.layers.2.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006555371219292283, + "sensitivity": 0.5298937326809323 + }, + { + "name": "model.layers.2.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.863262231287081e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006783413700759411, + "sensitivity": 0.5360677603850484 + }, + { + "name": "model.layers.2.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006589422700926661, + "sensitivity": 0.52567734290152 + }, + { + "name": "model.layers.2.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.903590931666258e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006865175673738122, + "sensitivity": 0.5113374437129758 + }, + { + "name": "model.layers.2.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.056283018551767e-05, + "sensitivity": 0.8130634937372851 + }, + { + "name": "model.layers.2.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.551108526764438e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007502136286348104, + "sensitivity": 0.5679884884984271 + }, + { + "name": "model.layers.2.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006572939455509186, + "sensitivity": 0.5285530080241079 + }, + { + "name": "model.layers.2.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.910529807806597e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.103175110183656e-05, + "sensitivity": 0.6974900573935633 + }, + { + "name": "model.layers.2.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006402467261068523, + "sensitivity": 0.5193772642978772 + }, + { + "name": "model.layers.2.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.721404932046426e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006634256569668651, + "sensitivity": 0.509148896437688 + }, + { + "name": "model.layers.2.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006636054022237659, + "sensitivity": 0.5575365228207116 + }, + { + "name": "model.layers.2.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.099635356804356e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006969396490603685, + "sensitivity": 0.5495433515091557 + }, + { + "name": "model.layers.2.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006525152130052447, + "sensitivity": 0.5353655557365348 + }, + { + "name": "model.layers.2.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.896843049413292e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006843453738838434, + "sensitivity": 0.5083458433448123 + }, + { + "name": "model.layers.2.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006681729573756456, + "sensitivity": 0.510966516522825 + }, + { + "name": "model.layers.2.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.199109066074016e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007100507500581443, + "sensitivity": 0.5243675741497633 + }, + { + "name": "model.layers.2.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8295827329857275e-05, + "sensitivity": 0.9484956892288682 + }, + { + "name": "model.layers.2.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.046155931471731e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000698285351973027, + "sensitivity": 0.5452995355393195 + }, + { + "name": "model.layers.2.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006641469663009048, + "sensitivity": 0.5122728100893725 + }, + { + "name": "model.layers.2.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.08182403993851e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007040153141133487, + "sensitivity": 0.52989166248 + }, + { + "name": "model.layers.2.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006552995182573795, + "sensitivity": 0.5353256304098736 + }, + { + "name": "model.layers.2.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.916703003094881e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006831820937804878, + "sensitivity": 0.5216248657576118 + }, + { + "name": "model.layers.2.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.982746370136738e-05, + "sensitivity": 0.636830613385323 + }, + { + "name": "model.layers.2.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.224976800695003e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007242219289764762, + "sensitivity": 0.524152812399479 + }, + { + "name": "model.layers.2.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006630783900618553, + "sensitivity": 0.560645864431946 + }, + { + "name": "model.layers.2.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.085374479880556e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007047917461022735, + "sensitivity": 0.5189983170325728 + }, + { + "name": "model.layers.2.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000661292695440352, + "sensitivity": 0.538721496916462 + }, + { + "name": "model.layers.2.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.903252713324036e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006858484703116119, + "sensitivity": 0.5175842759376842 + }, + { + "name": "model.layers.2.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006530710961669683, + "sensitivity": 0.5174343079627206 + }, + { + "name": "model.layers.2.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.885612495148962e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006827026372775435, + "sensitivity": 0.5384035207869178 + }, + { + "name": "model.layers.2.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006474404945038259, + "sensitivity": 0.5591837012619704 + }, + { + "name": "model.layers.2.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.764767365690204e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000665488769300282, + "sensitivity": 0.5344813831108406 + }, + { + "name": "model.layers.2.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0248272347962484e-05, + "sensitivity": 0.8088675037872083 + }, + { + "name": "model.layers.2.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.614799303861219e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007504869136027992, + "sensitivity": 0.5237759632866068 + }, + { + "name": "model.layers.2.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006573947030119598, + "sensitivity": 0.5319763064105894 + }, + { + "name": "model.layers.2.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.943034011579584e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006883634487167001, + "sensitivity": 0.5066853077842175 + }, + { + "name": "model.layers.2.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006520501337945461, + "sensitivity": 0.5203838029279557 + }, + { + "name": "model.layers.2.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.995697733851557e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006901883753016591, + "sensitivity": 0.5290526117255341 + }, + { + "name": "model.layers.2.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006562476046383381, + "sensitivity": 0.5281240206977428 + }, + { + "name": "model.layers.2.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.860451324224414e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006805011071264744, + "sensitivity": 0.5461121242462301 + }, + { + "name": "model.layers.2.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000656422576867044, + "sensitivity": 0.5200439116695399 + }, + { + "name": "model.layers.2.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.915557608204836e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006836946122348309, + "sensitivity": 0.5328029935690293 + }, + { + "name": "model.layers.2.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006833894876763225, + "sensitivity": 0.5645945286382655 + }, + { + "name": "model.layers.2.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.547567181769409e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007568466826342046, + "sensitivity": 0.5228128781431518 + }, + { + "name": "model.layers.2.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.886183862457983e-05, + "sensitivity": 0.6841249970844974 + }, + { + "name": "model.layers.2.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.953453978690959e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006884029135107994, + "sensitivity": 0.5690201736260146 + }, + { + "name": "model.layers.2.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006462761084549129, + "sensitivity": 0.5673701104285848 + }, + { + "name": "model.layers.2.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.850297384313308e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0109508922323585e-05, + "sensitivity": 1.0060064428874793 + }, + { + "name": "model.layers.2.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006560714682564139, + "sensitivity": 0.5284611704128155 + }, + { + "name": "model.layers.2.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.948444936620945e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006893288227729499, + "sensitivity": 0.5702227039931743 + }, + { + "name": "model.layers.2.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.577230796101503e-05, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.7074335119104944e-06, + "sensitivity": 2.098499783883584 + }, + { + "name": "model.layers.2.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.901593229078571e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.2.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.508206878497731e-06, + "sensitivity": 2.10002572709809 + }, + { + "name": "model.layers.2.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 7.818973244866356e-06, + "sensitivity": 2.147258117697571 + }, + { + "name": "model.layers.2.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 4, + "mse": 4.0905903006205335e-05, + "sensitivity": 1.6965800120929972 + }, + { + "name": "model.layers.2.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.0648647730704397e-05, + "sensitivity": 1.3951812998881747 + }, + { + "name": "model.layers.2.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 3.31717892549932e-05, + "sensitivity": 0.6802548373058802 + }, + { + "name": "model.layers.2.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 4, + "mse": 6.339624087559059e-05, + "sensitivity": 1.3975228176289385 + }, + { + "name": "model.layers.3.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.00063593580853194, + "sensitivity": 0.5430232024275826 + }, + { + "name": "model.layers.3.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.87619183534116e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006775655783712864, + "sensitivity": 0.5364652703539503 + }, + { + "name": "model.layers.3.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.091729301260784e-05, + "sensitivity": 0.8758214002175702 + }, + { + "name": "model.layers.3.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.550861826326582e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007419133326038718, + "sensitivity": 0.5031770573616399 + }, + { + "name": "model.layers.3.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006539140595123172, + "sensitivity": 0.5156224245959506 + }, + { + "name": "model.layers.3.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.041358346919878e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006979070021770895, + "sensitivity": 0.5337455090844447 + }, + { + "name": "model.layers.3.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.910659092478454e-05, + "sensitivity": 0.7615865120359873 + }, + { + "name": "model.layers.3.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.199755375746463e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007079739589244127, + "sensitivity": 0.5186877673014849 + }, + { + "name": "model.layers.3.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.741295899497345e-05, + "sensitivity": 0.6104928520252837 + }, + { + "name": "model.layers.3.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.986527185086743e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006870722281746566, + "sensitivity": 0.5212532050489352 + }, + { + "name": "model.layers.3.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9157471696380526e-05, + "sensitivity": 0.7005442004099369 + }, + { + "name": "model.layers.3.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.21246954324306e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007166705909185112, + "sensitivity": 0.5068299902955895 + }, + { + "name": "model.layers.3.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006489607039839029, + "sensitivity": 0.5702282640285534 + }, + { + "name": "model.layers.3.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.028569714544574e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000688763742800802, + "sensitivity": 0.5151941100294097 + }, + { + "name": "model.layers.3.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006581756169907749, + "sensitivity": 0.562388515824322 + }, + { + "name": "model.layers.3.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.113843369348615e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007013880531303585, + "sensitivity": 0.5320735089131359 + }, + { + "name": "model.layers.3.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.792729643872008e-05, + "sensitivity": 0.6165566741934022 + }, + { + "name": "model.layers.3.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.101906819822034e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006918259314261377, + "sensitivity": 0.5277533306909968 + }, + { + "name": "model.layers.3.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.773475277237594e-05, + "sensitivity": 1.065904351227277 + }, + { + "name": "model.layers.3.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.075218266232696e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.182939978316426e-05, + "sensitivity": 0.8094881146101557 + }, + { + "name": "model.layers.3.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.902955308556557e-05, + "sensitivity": 0.6117015953663638 + }, + { + "name": "model.layers.3.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.193683361743751e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.305395800154656e-05, + "sensitivity": 0.7475151547380012 + }, + { + "name": "model.layers.3.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.426580901257694e-05, + "sensitivity": 0.633102349523764 + }, + { + "name": "model.layers.3.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.676744763150054e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006479050498455763, + "sensitivity": 0.551328686677978 + }, + { + "name": "model.layers.3.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.48198695469182e-05, + "sensitivity": 0.6350401600256882 + }, + { + "name": "model.layers.3.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.833800855725713e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006586072267964482, + "sensitivity": 0.5943592141304582 + }, + { + "name": "model.layers.3.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006400199490599334, + "sensitivity": 0.5501998948882761 + }, + { + "name": "model.layers.3.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.879227273908327e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006750888423994184, + "sensitivity": 0.5385456308886837 + }, + { + "name": "model.layers.3.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006544290808960795, + "sensitivity": 0.5306381212501703 + }, + { + "name": "model.layers.3.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.093291062825301e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007017123280093074, + "sensitivity": 0.5151548891316297 + }, + { + "name": "model.layers.3.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000645527383312583, + "sensitivity": 0.5463274425564426 + }, + { + "name": "model.layers.3.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.935831381975731e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006828274927102029, + "sensitivity": 0.5333471389618857 + }, + { + "name": "model.layers.3.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.858881559106521e-05, + "sensitivity": 0.7330903875455574 + }, + { + "name": "model.layers.3.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.230936833162559e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006992520648054779, + "sensitivity": 0.5205404914456199 + }, + { + "name": "model.layers.3.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006345001165755093, + "sensitivity": 0.554377005278974 + }, + { + "name": "model.layers.3.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.920819035054592e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000684410217218101, + "sensitivity": 0.5487942695479187 + }, + { + "name": "model.layers.3.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7502795243635774e-05, + "sensitivity": 0.6828860302131479 + }, + { + "name": "model.layers.3.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.009514663674054e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.131693226052448e-05, + "sensitivity": 0.8027049204789443 + }, + { + "name": "model.layers.3.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006253503961488605, + "sensitivity": 0.5621347816845306 + }, + { + "name": "model.layers.3.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.734432875215134e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006615376914851367, + "sensitivity": 0.5059224374696656 + }, + { + "name": "model.layers.3.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5044372857082635e-05, + "sensitivity": 0.696338610026166 + }, + { + "name": "model.layers.3.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.73208239984524e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006520901224575937, + "sensitivity": 0.5154749613399006 + }, + { + "name": "model.layers.3.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8320682001067325e-05, + "sensitivity": 0.8175322134037014 + }, + { + "name": "model.layers.3.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.507033845082333e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007161802495829761, + "sensitivity": 0.5376540225314611 + }, + { + "name": "model.layers.3.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.683034396497533e-05, + "sensitivity": 0.9988975464625485 + }, + { + "name": "model.layers.3.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.148384841253574e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007014616276137531, + "sensitivity": 0.5217756401296084 + }, + { + "name": "model.layers.3.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006409456254914403, + "sensitivity": 0.5978135238094178 + }, + { + "name": "model.layers.3.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.939829748058401e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006849629571661353, + "sensitivity": 0.548431495747174 + }, + { + "name": "model.layers.3.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0148036380996928e-05, + "sensitivity": 1.4424507097074126 + }, + { + "name": "model.layers.3.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.016672386977007e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006866276962682605, + "sensitivity": 0.5846404749955542 + }, + { + "name": "model.layers.3.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000626497610937804, + "sensitivity": 0.5449074783918296 + }, + { + "name": "model.layers.3.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.828055691381451e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000664094346575439, + "sensitivity": 0.5567688627763755 + }, + { + "name": "model.layers.3.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006314413039945066, + "sensitivity": 0.5564190051450675 + }, + { + "name": "model.layers.3.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.917506769037573e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006772349588572979, + "sensitivity": 0.5356475827492617 + }, + { + "name": "model.layers.3.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.946636520093307e-05, + "sensitivity": 0.6127192817404247 + }, + { + "name": "model.layers.3.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.572028610207781e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007238445687107742, + "sensitivity": 0.5789147539468882 + }, + { + "name": "model.layers.3.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.965561649645679e-05, + "sensitivity": 0.7090424618148079 + }, + { + "name": "model.layers.3.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.521704563056119e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000710384629201144, + "sensitivity": 0.5258531580553331 + }, + { + "name": "model.layers.3.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6439614127157256e-05, + "sensitivity": 0.6625542175648291 + }, + { + "name": "model.layers.3.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.995320293550321e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.01209576416295e-05, + "sensitivity": 0.6532757369505087 + }, + { + "name": "model.layers.3.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.503774082171731e-05, + "sensitivity": 0.6438836822286116 + }, + { + "name": "model.layers.3.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.718124498343968e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006558168679475784, + "sensitivity": 0.5197857729688911 + }, + { + "name": "model.layers.3.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6219294492620975e-05, + "sensitivity": 0.7374226579422996 + }, + { + "name": "model.layers.3.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.879280706722056e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006719309603795409, + "sensitivity": 0.5258574294089011 + }, + { + "name": "model.layers.3.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.006429248373024e-05, + "sensitivity": 1.0739160094167717 + }, + { + "name": "model.layers.3.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.393767080226098e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007383766351267695, + "sensitivity": 0.5649355831799652 + }, + { + "name": "model.layers.3.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.762153159594163e-05, + "sensitivity": 0.6793091596006905 + }, + { + "name": "model.layers.3.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.07872038926871e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006984722567722201, + "sensitivity": 0.5271541299642981 + }, + { + "name": "model.layers.3.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.989874989609234e-05, + "sensitivity": 1.0466011786443667 + }, + { + "name": "model.layers.3.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.391964575414022e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007280685822479427, + "sensitivity": 0.5081441401570113 + }, + { + "name": "model.layers.3.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4615164117421955e-05, + "sensitivity": 1.1189854924578508 + }, + { + "name": "model.layers.3.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.781472509625019e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006547452649101615, + "sensitivity": 0.5169401879797204 + }, + { + "name": "model.layers.3.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0734313036664389e-05, + "sensitivity": 1.369552824379895 + }, + { + "name": "model.layers.3.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.147006388346199e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007067007245495915, + "sensitivity": 0.5884208019055 + }, + { + "name": "model.layers.3.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0428188033984043e-05, + "sensitivity": 1.2413557413837366 + }, + { + "name": "model.layers.3.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.269786467782978e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.279387162066996e-05, + "sensitivity": 0.6032397191324705 + }, + { + "name": "model.layers.3.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.654348569805734e-05, + "sensitivity": 0.7034706375817534 + }, + { + "name": "model.layers.3.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.896890797885135e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000680685683619231, + "sensitivity": 0.5763596883582942 + }, + { + "name": "model.layers.3.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0140966525068507e-05, + "sensitivity": 0.8305808928412759 + }, + { + "name": "model.layers.3.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.331507620416232e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007293893722817302, + "sensitivity": 0.5057488615266915 + }, + { + "name": "model.layers.3.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006461211014539003, + "sensitivity": 0.5508058635562912 + }, + { + "name": "model.layers.3.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.982010407024063e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000691656197886914, + "sensitivity": 0.5308872852423764 + }, + { + "name": "model.layers.3.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006294729537330568, + "sensitivity": 0.5363988562641436 + }, + { + "name": "model.layers.3.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.834717171637749e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000676157302223146, + "sensitivity": 0.517707507129877 + }, + { + "name": "model.layers.3.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006400012644007802, + "sensitivity": 0.5314646919099445 + }, + { + "name": "model.layers.3.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.881033757759724e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000677260453812778, + "sensitivity": 0.5201251119964416 + }, + { + "name": "model.layers.3.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.826718916068785e-05, + "sensitivity": 0.7963243547561945 + }, + { + "name": "model.layers.3.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.424131129278976e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007170999306254089, + "sensitivity": 0.5605271764377608 + }, + { + "name": "model.layers.3.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.965044692857191e-05, + "sensitivity": 1.121931476295204 + }, + { + "name": "model.layers.3.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.377862860063033e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.491619569715112e-05, + "sensitivity": 0.7275503558516132 + }, + { + "name": "model.layers.3.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.649604645441286e-05, + "sensitivity": 0.9877248564071845 + }, + { + "name": "model.layers.3.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.062484771973686e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007004417711868882, + "sensitivity": 0.5217309481637598 + }, + { + "name": "model.layers.3.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006284484989009798, + "sensitivity": 0.5350580223049145 + }, + { + "name": "model.layers.3.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.770875191046798e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8811798226088285e-05, + "sensitivity": 0.6733398746406911 + }, + { + "name": "model.layers.3.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006422955193556845, + "sensitivity": 0.5505917269442313 + }, + { + "name": "model.layers.3.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.993833269712923e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006958412704989314, + "sensitivity": 0.5854761677525975 + }, + { + "name": "model.layers.3.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006699791993014514, + "sensitivity": 0.5358264929659072 + }, + { + "name": "model.layers.3.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.198092705744784e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007099717622622848, + "sensitivity": 0.5346157036245428 + }, + { + "name": "model.layers.3.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006312435725703835, + "sensitivity": 0.5251535189339226 + }, + { + "name": "model.layers.3.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.814833912154427e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9694422816392034e-05, + "sensitivity": 0.6193281486876698 + }, + { + "name": "model.layers.3.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8780813560588285e-05, + "sensitivity": 0.7231492023329549 + }, + { + "name": "model.layers.3.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.200470465955732e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.326285802060738e-05, + "sensitivity": 0.7051816550862493 + }, + { + "name": "model.layers.3.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.654421329381876e-05, + "sensitivity": 0.6031831838899582 + }, + { + "name": "model.layers.3.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.833868499394157e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006718530785292387, + "sensitivity": 0.5345202583615352 + }, + { + "name": "model.layers.3.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.719436376239173e-05, + "sensitivity": 0.9031337720154082 + }, + { + "name": "model.layers.3.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.584708671653061e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.344912981148809e-05, + "sensitivity": 0.7556124787183653 + }, + { + "name": "model.layers.3.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006591096753254533, + "sensitivity": 0.534234559632827 + }, + { + "name": "model.layers.3.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.317984571069246e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007041746284812689, + "sensitivity": 0.5190675988572403 + }, + { + "name": "model.layers.3.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5427197366952896e-05, + "sensitivity": 0.6398885719774335 + }, + { + "name": "model.layers.3.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.706584715881036e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006582773639820516, + "sensitivity": 0.5377715233347513 + }, + { + "name": "model.layers.3.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8989502576878294e-05, + "sensitivity": 0.7289309938505997 + }, + { + "name": "model.layers.3.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.198083042363578e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.340871914289892e-05, + "sensitivity": 0.6531462438374389 + }, + { + "name": "model.layers.3.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006652008160017431, + "sensitivity": 0.5171420998287919 + }, + { + "name": "model.layers.3.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.12036728853127e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007055251626297832, + "sensitivity": 0.5676039696237534 + }, + { + "name": "model.layers.3.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006474289111793041, + "sensitivity": 0.5876028630967646 + }, + { + "name": "model.layers.3.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.983672508591553e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000688107218593359, + "sensitivity": 0.5147396395345538 + }, + { + "name": "model.layers.3.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006492796819657087, + "sensitivity": 0.5222609367409197 + }, + { + "name": "model.layers.3.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.036588615643268e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006943026091903448, + "sensitivity": 0.5308839089224235 + }, + { + "name": "model.layers.3.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006468555075116456, + "sensitivity": 0.5260981794844644 + }, + { + "name": "model.layers.3.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.986103133182041e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006897455314174294, + "sensitivity": 0.5160467543670397 + }, + { + "name": "model.layers.3.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006478052819147706, + "sensitivity": 0.5387773289182812 + }, + { + "name": "model.layers.3.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.009663593431469e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006892017554491758, + "sensitivity": 0.5268405750863576 + }, + { + "name": "model.layers.3.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006807054160162807, + "sensitivity": 0.5244083928405672 + }, + { + "name": "model.layers.3.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.457566996687092e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007268574554473162, + "sensitivity": 0.5985906193100711 + }, + { + "name": "model.layers.3.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0341043889638968e-05, + "sensitivity": 1.292051315034703 + }, + { + "name": "model.layers.3.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.742347634120961e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.618005863856524e-05, + "sensitivity": 0.7489929393235137 + }, + { + "name": "model.layers.3.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7905032008420676e-05, + "sensitivity": 0.8416593950138431 + }, + { + "name": "model.layers.3.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.132080443421728e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006992376293055713, + "sensitivity": 0.5806547005250491 + }, + { + "name": "model.layers.3.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.4707671653013676e-05, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.8423783103571623e-06, + "sensitivity": 2.098377235895172 + }, + { + "name": "model.layers.3.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.410683338093804e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.3.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.288716134695278e-06, + "sensitivity": 2.0998427026721727 + }, + { + "name": "model.layers.3.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 4.266714768164093e-06, + "sensitivity": 2.1413734045911217 + }, + { + "name": "model.layers.3.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00016959359345491976, + "sensitivity": 1.1131602589444205 + }, + { + "name": "model.layers.3.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 9.776992555998731e-06, + "sensitivity": 1.9396941305604074 + }, + { + "name": "model.layers.3.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0004930543364025652, + "sensitivity": 0.5919940435703095 + }, + { + "name": "model.layers.3.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002845010021701455, + "sensitivity": 0.7547897019998614 + }, + { + "name": "model.layers.4.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.959023373085074e-06, + "sensitivity": 1.7346312086510745 + }, + { + "name": "model.layers.4.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.704270051865024e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006549562676809728, + "sensitivity": 0.5199055569317109 + }, + { + "name": "model.layers.4.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0713122719607782e-05, + "sensitivity": 1.2416166142285858 + }, + { + "name": "model.layers.4.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.377402996804449e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007140231318771839, + "sensitivity": 0.5937989023630675 + }, + { + "name": "model.layers.4.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.570126086240634e-05, + "sensitivity": 0.9219779411151934 + }, + { + "name": "model.layers.4.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.913018412684323e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006761299446225166, + "sensitivity": 0.5182963202860243 + }, + { + "name": "model.layers.4.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006638127379119396, + "sensitivity": 0.5313759064184411 + }, + { + "name": "model.layers.4.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.13152849382459e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007027533720247447, + "sensitivity": 0.5392272895470478 + }, + { + "name": "model.layers.4.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.153027061372995e-05, + "sensitivity": 0.6808088158597838 + }, + { + "name": "model.layers.4.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.620541057600349e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.810248305555433e-05, + "sensitivity": 0.6028488418616891 + }, + { + "name": "model.layers.4.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000610309827607125, + "sensitivity": 0.5605668759695749 + }, + { + "name": "model.layers.4.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.62465345410601e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006487327045761049, + "sensitivity": 0.535803340485285 + }, + { + "name": "model.layers.4.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7855759223457426e-05, + "sensitivity": 0.6307544232643381 + }, + { + "name": "model.layers.4.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.018855174261262e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006865696050226688, + "sensitivity": 0.5187692507264638 + }, + { + "name": "model.layers.4.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.309467163286172e-06, + "sensitivity": 2.0965146858119565 + }, + { + "name": "model.layers.4.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.221657713467721e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007054675370454788, + "sensitivity": 0.5258228971118779 + }, + { + "name": "model.layers.4.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.017951818648726e-05, + "sensitivity": 0.8021256530441474 + }, + { + "name": "model.layers.4.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.445762892326456e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007271431386470795, + "sensitivity": 0.5144820788436422 + }, + { + "name": "model.layers.4.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5640601203776896e-05, + "sensitivity": 0.7938536134377926 + }, + { + "name": "model.layers.4.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.896031325391959e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000684570986777544, + "sensitivity": 0.5200069689255795 + }, + { + "name": "model.layers.4.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7598110288381577e-05, + "sensitivity": 0.9031943538194651 + }, + { + "name": "model.layers.4.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.073951226426288e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000686062965542078, + "sensitivity": 0.5316851545941069 + }, + { + "name": "model.layers.4.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.564516322920099e-05, + "sensitivity": 0.7047255894974899 + }, + { + "name": "model.layers.4.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.906859996684943e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006784327561035752, + "sensitivity": 0.5095191294543889 + }, + { + "name": "model.layers.4.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.516660611552652e-06, + "sensitivity": 1.4334432828157406 + }, + { + "name": "model.layers.4.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.523261847883987e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006367077003233135, + "sensitivity": 0.5787417372964158 + }, + { + "name": "model.layers.4.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8555036957841367e-05, + "sensitivity": 0.8164007384490011 + }, + { + "name": "model.layers.4.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.308707156676974e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007151543977670372, + "sensitivity": 0.5201783077886792 + }, + { + "name": "model.layers.4.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.743873043684289e-05, + "sensitivity": 0.8079103575090971 + }, + { + "name": "model.layers.4.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.912332881052862e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006763706333003938, + "sensitivity": 0.5778736155851006 + }, + { + "name": "model.layers.4.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8498946600593626e-05, + "sensitivity": 0.632088950096355 + }, + { + "name": "model.layers.4.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.227319317986257e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000708900042809546, + "sensitivity": 0.5239415335722322 + }, + { + "name": "model.layers.4.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8306133723817766e-05, + "sensitivity": 0.7203242586609653 + }, + { + "name": "model.layers.4.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.970799747956335e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.063139153411612e-05, + "sensitivity": 0.6428740079972061 + }, + { + "name": "model.layers.4.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7433993788436055e-05, + "sensitivity": 1.0890961528421093 + }, + { + "name": "model.layers.4.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.148197257971333e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000705514510627836, + "sensitivity": 0.5070438651210525 + }, + { + "name": "model.layers.4.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.1027269111946225e-05, + "sensitivity": 0.7232989010540429 + }, + { + "name": "model.layers.4.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.530676728289109e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007466083625331521, + "sensitivity": 0.5402790039990331 + }, + { + "name": "model.layers.4.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9017234889324754e-05, + "sensitivity": 1.0965640101616998 + }, + { + "name": "model.layers.4.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.272433665799326e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007178797386586666, + "sensitivity": 0.509755462156742 + }, + { + "name": "model.layers.4.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7358101912541315e-05, + "sensitivity": 0.8958166245357477 + }, + { + "name": "model.layers.4.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.074166094549582e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007001352496445179, + "sensitivity": 0.5112674749472584 + }, + { + "name": "model.layers.4.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.433113983599469e-05, + "sensitivity": 0.7794476399656942 + }, + { + "name": "model.layers.4.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.944759777776198e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006729679880663753, + "sensitivity": 0.5240349029615421 + }, + { + "name": "model.layers.4.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.609160770196468e-06, + "sensitivity": 1.2677153086862711 + }, + { + "name": "model.layers.4.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.717171234209673e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006343355635181069, + "sensitivity": 0.5342927937585691 + }, + { + "name": "model.layers.4.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4938122048042715e-05, + "sensitivity": 0.8171639088829395 + }, + { + "name": "model.layers.4.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.81988842895953e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006602167850360274, + "sensitivity": 0.5300885906130786 + }, + { + "name": "model.layers.4.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.506798333954066e-05, + "sensitivity": 0.704250212740196 + }, + { + "name": "model.layers.4.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.852811000295333e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006746356375515461, + "sensitivity": 0.554251167275761 + }, + { + "name": "model.layers.4.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3919513447908685e-05, + "sensitivity": 1.023908276174196 + }, + { + "name": "model.layers.4.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.751232947659446e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006607001414522529, + "sensitivity": 0.5582343361133111 + }, + { + "name": "model.layers.4.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7377066696062684e-05, + "sensitivity": 1.0741872383486537 + }, + { + "name": "model.layers.4.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.193357648953679e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007175027276389301, + "sensitivity": 0.5317101716642794 + }, + { + "name": "model.layers.4.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.796353070763871e-05, + "sensitivity": 0.6159290997042038 + }, + { + "name": "model.layers.4.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.995516403345391e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006896600825712085, + "sensitivity": 0.524997326269811 + }, + { + "name": "model.layers.4.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.646081262966618e-05, + "sensitivity": 0.865569014339094 + }, + { + "name": "model.layers.4.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.977705086479546e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006867594784125686, + "sensitivity": 0.5296383521306762 + }, + { + "name": "model.layers.4.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.377529305405915e-05, + "sensitivity": 1.091944070853306 + }, + { + "name": "model.layers.4.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.929414328420535e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006854366511106491, + "sensitivity": 0.571029937491516 + }, + { + "name": "model.layers.4.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.49130309082102e-05, + "sensitivity": 0.8289599335219076 + }, + { + "name": "model.layers.4.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.077071361687558e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006736404611729085, + "sensitivity": 0.52190277428335 + }, + { + "name": "model.layers.4.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.949939804850146e-05, + "sensitivity": 0.7021213464657461 + }, + { + "name": "model.layers.4.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.466201512012049e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007363377371802926, + "sensitivity": 0.5240762317457173 + }, + { + "name": "model.layers.4.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0485124221304432e-05, + "sensitivity": 1.2091829771167604 + }, + { + "name": "model.layers.4.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.355311370498384e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007276776013895869, + "sensitivity": 0.5350684047084941 + }, + { + "name": "model.layers.4.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.0414713768986985e-05, + "sensitivity": 1.1954192346210963 + }, + { + "name": "model.layers.4.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.342640747585392e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.245885404292494e-05, + "sensitivity": 0.6884716238135367 + }, + { + "name": "model.layers.4.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.1937235032964963e-06, + "sensitivity": 2.016860345775247 + }, + { + "name": "model.layers.4.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.930723432356899e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006739184027537704, + "sensitivity": 0.5483003430478943 + }, + { + "name": "model.layers.4.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.823510582558811e-05, + "sensitivity": 0.6324875784644 + }, + { + "name": "model.layers.4.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.320157126538106e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007200042600743473, + "sensitivity": 0.551155942535246 + }, + { + "name": "model.layers.4.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.438040534500033e-05, + "sensitivity": 0.9350599601086184 + }, + { + "name": "model.layers.4.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.0775931842727e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.78917060920503e-05, + "sensitivity": 0.7650789000076501 + }, + { + "name": "model.layers.4.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.909376704948954e-05, + "sensitivity": 0.8202056554845505 + }, + { + "name": "model.layers.4.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.100538030295866e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000704023870639503, + "sensitivity": 0.5285862520875373 + }, + { + "name": "model.layers.4.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.693483035429381e-05, + "sensitivity": 0.8736741529223327 + }, + { + "name": "model.layers.4.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.222966248969897e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007106876000761986, + "sensitivity": 0.583445400294085 + }, + { + "name": "model.layers.4.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.017299892846495e-05, + "sensitivity": 0.6698673774459906 + }, + { + "name": "model.layers.4.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.503350959974341e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007395264692604542, + "sensitivity": 0.5700756284276312 + }, + { + "name": "model.layers.4.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.209360097069293e-05, + "sensitivity": 1.0926622424704369 + }, + { + "name": "model.layers.4.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.496142989613872e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006210344727151096, + "sensitivity": 0.5283334296229076 + }, + { + "name": "model.layers.4.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.060933810658753e-05, + "sensitivity": 0.7141256202946706 + }, + { + "name": "model.layers.4.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.611483058804879e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007574378396384418, + "sensitivity": 0.5309336864195771 + }, + { + "name": "model.layers.4.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5278953368542716e-05, + "sensitivity": 0.6024113454213506 + }, + { + "name": "model.layers.4.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.88068814977305e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000673910602927208, + "sensitivity": 0.5348970477030579 + }, + { + "name": "model.layers.4.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.725361451273784e-06, + "sensitivity": 1.534273639951054 + }, + { + "name": "model.layers.4.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.860005103386356e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006267968565225601, + "sensitivity": 0.5489913871802142 + }, + { + "name": "model.layers.4.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.67998577025719e-05, + "sensitivity": 1.1807153799036776 + }, + { + "name": "model.layers.4.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.182884817462764e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006991793634369969, + "sensitivity": 0.5185081241337985 + }, + { + "name": "model.layers.4.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.039304152072873e-05, + "sensitivity": 1.3038230169811424 + }, + { + "name": "model.layers.4.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.002355235068535e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006890959921292961, + "sensitivity": 0.5297047279403019 + }, + { + "name": "model.layers.4.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5416327086277306e-05, + "sensitivity": 0.9179303270804696 + }, + { + "name": "model.layers.4.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.009824460306845e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006637977785430849, + "sensitivity": 0.5522048112531788 + }, + { + "name": "model.layers.4.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.630448868032545e-05, + "sensitivity": 0.8070689799551635 + }, + { + "name": "model.layers.4.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.955032520432724e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006774622015655041, + "sensitivity": 0.5880112787340146 + }, + { + "name": "model.layers.4.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0157731594517827e-05, + "sensitivity": 1.2135542491252087 + }, + { + "name": "model.layers.4.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.545716016466031e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.038389983586967e-05, + "sensitivity": 0.9323589220151864 + }, + { + "name": "model.layers.4.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.676992704044096e-06, + "sensitivity": 1.2849825942595428 + }, + { + "name": "model.layers.4.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.675686907125055e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006298433290794492, + "sensitivity": 0.5061507542744497 + }, + { + "name": "model.layers.4.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.576513548381627e-06, + "sensitivity": 1.3848172265230652 + }, + { + "name": "model.layers.4.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.680072945324355e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5492269893875346e-05, + "sensitivity": 0.6275082632314002 + }, + { + "name": "model.layers.4.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.768839764641598e-05, + "sensitivity": 0.7287039377070708 + }, + { + "name": "model.layers.4.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.140807613519428e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000706191174685955, + "sensitivity": 0.5502893097144734 + }, + { + "name": "model.layers.4.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0309846402378753e-05, + "sensitivity": 1.4476616898373786 + }, + { + "name": "model.layers.4.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.682955131509516e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.3294981373474e-05, + "sensitivity": 0.7825293612413317 + }, + { + "name": "model.layers.4.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.719540058635175e-05, + "sensitivity": 0.8004786904564992 + }, + { + "name": "model.layers.4.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.98266524320934e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0802831285400316e-05, + "sensitivity": 0.7692693835377475 + }, + { + "name": "model.layers.4.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006590033881366253, + "sensitivity": 0.5382897472288203 + }, + { + "name": "model.layers.4.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.168420441099443e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007029214175418019, + "sensitivity": 0.533473039544969 + }, + { + "name": "model.layers.4.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0979662874888163e-05, + "sensitivity": 1.4187784956459988 + }, + { + "name": "model.layers.4.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.304548492153117e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007192965131253004, + "sensitivity": 0.5147991117689501 + }, + { + "name": "model.layers.4.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006418500561267138, + "sensitivity": 0.5357255908001842 + }, + { + "name": "model.layers.4.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.123759703768883e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.1001726862741634e-05, + "sensitivity": 0.7788451550669223 + }, + { + "name": "model.layers.4.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006414218223653734, + "sensitivity": 0.5724397024626909 + }, + { + "name": "model.layers.4.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.955604933660652e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006735196220688522, + "sensitivity": 0.5213538938587077 + }, + { + "name": "model.layers.4.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6913384469226e-05, + "sensitivity": 0.7962210879346985 + }, + { + "name": "model.layers.4.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.287492624323932e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007062514196150005, + "sensitivity": 0.52689865220847 + }, + { + "name": "model.layers.4.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6400713219773024e-05, + "sensitivity": 1.1258377371068682 + }, + { + "name": "model.layers.4.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.121783258095093e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006909125950187445, + "sensitivity": 0.5351683018522232 + }, + { + "name": "model.layers.4.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.836490890942514e-05, + "sensitivity": 0.7554787803486829 + }, + { + "name": "model.layers.4.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.338881917145045e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.446975748986006e-05, + "sensitivity": 0.7499779706196759 + }, + { + "name": "model.layers.4.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.48386968957493e-06, + "sensitivity": 1.6020962215949133 + }, + { + "name": "model.layers.4.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.603965291811619e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5742901167832315e-05, + "sensitivity": 0.6006346031555789 + }, + { + "name": "model.layers.4.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7089910114882514e-05, + "sensitivity": 0.642136559694088 + }, + { + "name": "model.layers.4.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.960771432000911e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006843778537586331, + "sensitivity": 0.5418152861423355 + }, + { + "name": "model.layers.4.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.311377390171401e-05, + "sensitivity": 1.1746644346618864 + }, + { + "name": "model.layers.4.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.518805892279488e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006235972978174686, + "sensitivity": 0.5478413725982015 + }, + { + "name": "model.layers.4.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.053935193340294e-05, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.814705228753155e-06, + "sensitivity": 2.0985073355307877 + }, + { + "name": "model.layers.4.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.592649010097375e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.4.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.258909605894587e-06, + "sensitivity": 2.1021021817516923 + }, + { + "name": "model.layers.4.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 4.3304680730216205e-06, + "sensitivity": 2.139205155040418 + }, + { + "name": "model.layers.4.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00015503790928050876, + "sensitivity": 1.0655228926901876 + }, + { + "name": "model.layers.4.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 8.80186416907236e-06, + "sensitivity": 1.8968979120843217 + }, + { + "name": "model.layers.4.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 4.173161505605094e-05, + "sensitivity": 0.6830911372138859 + }, + { + "name": "model.layers.4.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002661650942172855, + "sensitivity": 0.8965080881700844 + }, + { + "name": "model.layers.5.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.174215039005503e-05, + "sensitivity": 0.9843739150451165 + }, + { + "name": "model.layers.5.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.564810408031917e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5830976634752005e-05, + "sensitivity": 0.6337483774187305 + }, + { + "name": "model.layers.5.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.842257814947516e-05, + "sensitivity": 0.6932919515382885 + }, + { + "name": "model.layers.5.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.355699611049204e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007030800334177911, + "sensitivity": 0.516178696787411 + }, + { + "name": "model.layers.5.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.353846790967509e-05, + "sensitivity": 0.6973962512973638 + }, + { + "name": "model.layers.5.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.496877406585554e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006247282726690173, + "sensitivity": 0.5252865660808536 + }, + { + "name": "model.layers.5.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3906591347185895e-05, + "sensitivity": 1.0536377867547408 + }, + { + "name": "model.layers.5.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.070972062843794e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006397582474164665, + "sensitivity": 0.5386142481473728 + }, + { + "name": "model.layers.5.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.2231858717277646e-05, + "sensitivity": 1.033181185567674 + }, + { + "name": "model.layers.5.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.714136364076694e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006197073380462825, + "sensitivity": 0.519867892027612 + }, + { + "name": "model.layers.5.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.725809023715556e-05, + "sensitivity": 0.7073294208690512 + }, + { + "name": "model.layers.5.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.491961244137201e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006804433651268482, + "sensitivity": 0.545881503122309 + }, + { + "name": "model.layers.5.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.329336611088365e-05, + "sensitivity": 1.0075511456440052 + }, + { + "name": "model.layers.5.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.834799819444015e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007530195871368051, + "sensitivity": 0.5154840169960146 + }, + { + "name": "model.layers.5.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.605082697002217e-05, + "sensitivity": 0.7955405343898763 + }, + { + "name": "model.layers.5.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.295622370089404e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.029677751939744e-05, + "sensitivity": 0.6594708535753782 + }, + { + "name": "model.layers.5.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.260434126190376e-06, + "sensitivity": 1.6321710367623246 + }, + { + "name": "model.layers.5.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.53603456410201e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 4.891031130682677e-05, + "sensitivity": 0.7298765596884031 + }, + { + "name": "model.layers.5.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006408148328773677, + "sensitivity": 0.5253962529194666 + }, + { + "name": "model.layers.5.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.203899829415604e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006920511368662119, + "sensitivity": 0.5587104692515144 + }, + { + "name": "model.layers.5.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006581306224688888, + "sensitivity": 0.5502422445742864 + }, + { + "name": "model.layers.5.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.373737733156304e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007101836381480098, + "sensitivity": 0.5422364777205122 + }, + { + "name": "model.layers.5.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.924526340095326e-05, + "sensitivity": 0.7175679843428365 + }, + { + "name": "model.layers.5.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.334136628538545e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007063177181407809, + "sensitivity": 0.5203362484609253 + }, + { + "name": "model.layers.5.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.671524195349775e-05, + "sensitivity": 0.8008182676364874 + }, + { + "name": "model.layers.5.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.309321634034859e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006944822962395847, + "sensitivity": 0.5168646184662502 + }, + { + "name": "model.layers.5.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.702851194655523e-05, + "sensitivity": 0.679463559976049 + }, + { + "name": "model.layers.5.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.206001899045077e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006879428401589394, + "sensitivity": 0.5593631946767503 + }, + { + "name": "model.layers.5.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.646301360684447e-05, + "sensitivity": 1.0021351770682114 + }, + { + "name": "model.layers.5.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.195568289513176e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.922857599216513e-05, + "sensitivity": 0.6967542960491347 + }, + { + "name": "model.layers.5.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006509709055535495, + "sensitivity": 0.5423859156865167 + }, + { + "name": "model.layers.5.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.079944796510972e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006791597115807235, + "sensitivity": 0.539600425108096 + }, + { + "name": "model.layers.5.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6305507314391434e-05, + "sensitivity": 0.9211884975750875 + }, + { + "name": "model.layers.5.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.026019150340289e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006643926026299596, + "sensitivity": 0.5172849654929196 + }, + { + "name": "model.layers.5.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.77859282202553e-05, + "sensitivity": 0.7549833002091353 + }, + { + "name": "model.layers.5.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.586571998923318e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006818104302510619, + "sensitivity": 0.5349807192449223 + }, + { + "name": "model.layers.5.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.907707964070141e-05, + "sensitivity": 0.6574790652188588 + }, + { + "name": "model.layers.5.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.213359142748232e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006978644523769617, + "sensitivity": 0.5982525898963724 + }, + { + "name": "model.layers.5.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.580030119745061e-05, + "sensitivity": 0.7748379942589774 + }, + { + "name": "model.layers.5.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.89624733038363e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006567444070242345, + "sensitivity": 0.541440914901235 + }, + { + "name": "model.layers.5.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006629341514781117, + "sensitivity": 0.5304558146363014 + }, + { + "name": "model.layers.5.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.269876848818967e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007067201077006757, + "sensitivity": 0.5168499046006105 + }, + { + "name": "model.layers.5.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5823660659370944e-05, + "sensitivity": 0.6864141336217173 + }, + { + "name": "model.layers.5.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.477018246187072e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006932415417395532, + "sensitivity": 0.5659518007170097 + }, + { + "name": "model.layers.5.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0476388524693903e-05, + "sensitivity": 1.2095679327853468 + }, + { + "name": "model.layers.5.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.940011078564567e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006665707915090024, + "sensitivity": 0.5539298415861739 + }, + { + "name": "model.layers.5.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.00069728511152789, + "sensitivity": 0.515991068608581 + }, + { + "name": "model.layers.5.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.440546940211789e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007280634599737823, + "sensitivity": 0.5293168124723057 + }, + { + "name": "model.layers.5.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000653837516438216, + "sensitivity": 0.54288689908718 + }, + { + "name": "model.layers.5.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.920973080719705e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006751860491931438, + "sensitivity": 0.5221701424280901 + }, + { + "name": "model.layers.5.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006429021595977247, + "sensitivity": 0.5684686334327551 + }, + { + "name": "model.layers.5.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.96036727529281e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9974972828058526e-05, + "sensitivity": 0.7781045262221374 + }, + { + "name": "model.layers.5.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.555509414989501e-05, + "sensitivity": 0.9789941479521471 + }, + { + "name": "model.layers.5.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.478286991296045e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7846667914418504e-05, + "sensitivity": 0.6565027945488117 + }, + { + "name": "model.layers.5.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.553921073442325e-05, + "sensitivity": 0.6710317476266412 + }, + { + "name": "model.layers.5.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.006390549373464e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006742792902514338, + "sensitivity": 0.5234245461923936 + }, + { + "name": "model.layers.5.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.029563554766355e-05, + "sensitivity": 1.5892542250939614 + }, + { + "name": "model.layers.5.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.095878575251845e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006657556514255702, + "sensitivity": 0.556324773196202 + }, + { + "name": "model.layers.5.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.908549792366102e-05, + "sensitivity": 0.6664558343050853 + }, + { + "name": "model.layers.5.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.301902431005146e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.134063733043149e-05, + "sensitivity": 0.734975632915761 + }, + { + "name": "model.layers.5.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006507124635390937, + "sensitivity": 0.5654197298507033 + }, + { + "name": "model.layers.5.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.145363613541122e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006953277625143528, + "sensitivity": 0.5780345991652724 + }, + { + "name": "model.layers.5.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000635674805380404, + "sensitivity": 0.5918118877563743 + }, + { + "name": "model.layers.5.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.228787015061243e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006791693158447742, + "sensitivity": 0.535816339537792 + }, + { + "name": "model.layers.5.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.716276791645214e-05, + "sensitivity": 0.787391963237162 + }, + { + "name": "model.layers.5.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.880636990696075e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.029927681083791e-05, + "sensitivity": 0.6125050699529027 + }, + { + "name": "model.layers.5.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006542237242683768, + "sensitivity": 0.5257367007978292 + }, + { + "name": "model.layers.5.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.196625008669798e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006931214011274278, + "sensitivity": 0.5145138811849617 + }, + { + "name": "model.layers.5.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.656527355313301e-05, + "sensitivity": 0.6811943924738636 + }, + { + "name": "model.layers.5.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.200555162649835e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.873247209819965e-05, + "sensitivity": 0.6020323996354071 + }, + { + "name": "model.layers.5.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3241787099977955e-05, + "sensitivity": 1.1338179137785596 + }, + { + "name": "model.layers.5.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.613159146378166e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000610903836786747, + "sensitivity": 0.5718141096041045 + }, + { + "name": "model.layers.5.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.801324005005881e-05, + "sensitivity": 0.612484346857023 + }, + { + "name": "model.layers.5.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.292070793278981e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.976529064355418e-05, + "sensitivity": 0.9273112634952105 + }, + { + "name": "model.layers.5.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.864018385182135e-05, + "sensitivity": 0.7857327125953946 + }, + { + "name": "model.layers.5.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.289542398008052e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007019054028205574, + "sensitivity": 0.5346692669026316 + }, + { + "name": "model.layers.5.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7246070355176926e-05, + "sensitivity": 0.6343480853423501 + }, + { + "name": "model.layers.5.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.344206440189737e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006717690266668797, + "sensitivity": 0.5292566951553956 + }, + { + "name": "model.layers.5.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.837646313011646e-05, + "sensitivity": 0.7265412878152719 + }, + { + "name": "model.layers.5.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.604503823837149e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000697412877343595, + "sensitivity": 0.5925325553723992 + }, + { + "name": "model.layers.5.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006463145255111158, + "sensitivity": 0.5488669948915348 + }, + { + "name": "model.layers.5.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.012177209413494e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000682407699059695, + "sensitivity": 0.5244532954282681 + }, + { + "name": "model.layers.5.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.2830815548077226e-05, + "sensitivity": 0.7663910631837445 + }, + { + "name": "model.layers.5.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.597265726464684e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006347924936562777, + "sensitivity": 0.5088161255018706 + }, + { + "name": "model.layers.5.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006716195493936539, + "sensitivity": 0.5396696316802261 + }, + { + "name": "model.layers.5.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.201529458849109e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007049547275528312, + "sensitivity": 0.5411393825692137 + }, + { + "name": "model.layers.5.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.735183003707789e-05, + "sensitivity": 0.6703659877324708 + }, + { + "name": "model.layers.5.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.314721190392447e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007044244557619095, + "sensitivity": 0.5172087733663017 + }, + { + "name": "model.layers.5.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4064392315922305e-05, + "sensitivity": 0.6419389805097342 + }, + { + "name": "model.layers.5.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.894686978535901e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006561823538504541, + "sensitivity": 0.5510746407303759 + }, + { + "name": "model.layers.5.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000687027582898736, + "sensitivity": 0.5375959837789887 + }, + { + "name": "model.layers.5.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.399092171704979e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000719776377081871, + "sensitivity": 0.5337910396441834 + }, + { + "name": "model.layers.5.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.596328264800832e-05, + "sensitivity": 0.8432147504930958 + }, + { + "name": "model.layers.5.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.925926416239236e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006601737695746124, + "sensitivity": 0.5082670036480471 + }, + { + "name": "model.layers.5.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.434603008325212e-05, + "sensitivity": 0.7519967508570867 + }, + { + "name": "model.layers.5.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.729173153667944e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006471384549513459, + "sensitivity": 0.5674974044724468 + }, + { + "name": "model.layers.5.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.743532528867945e-05, + "sensitivity": 0.7210069684863524 + }, + { + "name": "model.layers.5.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.20418347807572e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.957320536253974e-05, + "sensitivity": 0.944383109278147 + }, + { + "name": "model.layers.5.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.49894092627801e-06, + "sensitivity": 1.4650584383291423 + }, + { + "name": "model.layers.5.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.308693289407529e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006015264661982656, + "sensitivity": 0.5255526858640602 + }, + { + "name": "model.layers.5.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.362502270145342e-05, + "sensitivity": 0.7566271527572925 + }, + { + "name": "model.layers.5.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.930090765104978e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006570519763045013, + "sensitivity": 0.5144489605770642 + }, + { + "name": "model.layers.5.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.573302769334987e-05, + "sensitivity": 0.7258019505556463 + }, + { + "name": "model.layers.5.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.769873041572282e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006574344588443637, + "sensitivity": 0.5264402729860789 + }, + { + "name": "model.layers.5.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006444156169891357, + "sensitivity": 0.5681259950445033 + }, + { + "name": "model.layers.5.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.934213618274953e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.00707862759009e-05, + "sensitivity": 0.6244539378251253 + }, + { + "name": "model.layers.5.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.686370423063636e-05, + "sensitivity": 0.6800411359730371 + }, + { + "name": "model.layers.5.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.917224825680023e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006606096867471933, + "sensitivity": 0.5469396662930713 + }, + { + "name": "model.layers.5.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3335090342443436e-05, + "sensitivity": 0.6839447914009902 + }, + { + "name": "model.layers.5.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.89446699450491e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.844645056640729e-05, + "sensitivity": 0.6789151255553665 + }, + { + "name": "model.layers.5.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.313480505719781e-05, + "sensitivity": 0.8584333073414157 + }, + { + "name": "model.layers.5.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.694774927178514e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006270682788453996, + "sensitivity": 0.5300546855743993 + }, + { + "name": "model.layers.5.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.604553734883666e-05, + "sensitivity": 0.6272113452550139 + }, + { + "name": "model.layers.5.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.172410280669283e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006582462228834629, + "sensitivity": 0.510560418248403 + }, + { + "name": "model.layers.5.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5765056458767503e-05, + "sensitivity": 0.7189735787208792 + }, + { + "name": "model.layers.5.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.850014304087381e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006653275340795517, + "sensitivity": 0.5232196949510948 + }, + { + "name": "model.layers.5.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.578563650487922e-05, + "sensitivity": 1.0818392452655214 + }, + { + "name": "model.layers.5.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.973244583401538e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006656750338152051, + "sensitivity": 0.5284393022162583 + }, + { + "name": "model.layers.5.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4715397709514946e-05, + "sensitivity": 1.1575811033805428 + }, + { + "name": "model.layers.5.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.734704586757289e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.585952749243006e-05, + "sensitivity": 0.6698928650932614 + }, + { + "name": "model.layers.5.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.115920405136421e-05, + "sensitivity": 0.9585933714760068 + }, + { + "name": "model.layers.5.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.284325877459196e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.330998439807445e-05, + "sensitivity": 0.6000029916787292 + }, + { + "name": "model.layers.5.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.215398778091185e-05, + "sensitivity": 0.7472831733199926 + }, + { + "name": "model.layers.5.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.608684432445443e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006313082994893193, + "sensitivity": 0.5473204568801391 + }, + { + "name": "model.layers.5.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.805590990348719e-05, + "sensitivity": 0.8599827505317831 + }, + { + "name": "model.layers.5.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.342478400256368e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.303254485828802e-05, + "sensitivity": 0.9845943170226459 + }, + { + "name": "model.layers.5.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3094069092621794e-06, + "sensitivity": 2.0972684463764555 + }, + { + "name": "model.layers.5.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.186810423969291e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.1210961019969545e-05, + "sensitivity": 1.2071490709379562 + }, + { + "name": "model.layers.5.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 9.185856470139697e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.7325196495221462e-06, + "sensitivity": 2.098507133975826 + }, + { + "name": "model.layers.5.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0104139391842182e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.5.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.3220778782851994e-06, + "sensitivity": 2.102846579004364 + }, + { + "name": "model.layers.5.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 5.372161467676051e-06, + "sensitivity": 2.1550550172764646 + }, + { + "name": "model.layers.5.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.0001751558593241498, + "sensitivity": 1.179238173833278 + }, + { + "name": "model.layers.5.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 9.56397252593888e-06, + "sensitivity": 1.8177267036929416 + }, + { + "name": "model.layers.5.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0005624552140943706, + "sensitivity": 0.5275247361843922 + }, + { + "name": "model.layers.5.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002904439461417496, + "sensitivity": 1.0437565429407842 + }, + { + "name": "model.layers.6.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006554018473252654, + "sensitivity": 0.5322259067099371 + }, + { + "name": "model.layers.6.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.044321025910904e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006911138771101832, + "sensitivity": 0.5541707118329273 + }, + { + "name": "model.layers.6.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.313691508490592e-05, + "sensitivity": 1.1504621314023844 + }, + { + "name": "model.layers.6.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.754645826527849e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006393723888322711, + "sensitivity": 0.5836531099395504 + }, + { + "name": "model.layers.6.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000657164491713047, + "sensitivity": 0.5740225757954931 + }, + { + "name": "model.layers.6.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.469273898801475e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007232431089505553, + "sensitivity": 0.5019334423065391 + }, + { + "name": "model.layers.6.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0180729077546857e-05, + "sensitivity": 1.3075928298156805 + }, + { + "name": "model.layers.6.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.936708132343483e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006528365192934871, + "sensitivity": 0.5297076561069719 + }, + { + "name": "model.layers.6.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.565343235502951e-05, + "sensitivity": 0.7201308727265029 + }, + { + "name": "model.layers.6.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.929150006522832e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006655083852820098, + "sensitivity": 0.5398736213827701 + }, + { + "name": "model.layers.6.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006868256605230272, + "sensitivity": 0.519030146800292 + }, + { + "name": "model.layers.6.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.453734613387496e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007280096760950983, + "sensitivity": 0.5254971861095359 + }, + { + "name": "model.layers.6.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.830052396049723e-05, + "sensitivity": 0.6540282437817707 + }, + { + "name": "model.layers.6.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.966799108136911e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006757627124898136, + "sensitivity": 0.5482891702613181 + }, + { + "name": "model.layers.6.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.77673563384451e-05, + "sensitivity": 0.9741345558962546 + }, + { + "name": "model.layers.6.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.235218279471155e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006719117518514395, + "sensitivity": 0.5577829679811837 + }, + { + "name": "model.layers.6.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0213829227723181e-05, + "sensitivity": 1.4861117726056752 + }, + { + "name": "model.layers.6.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.984256515352172e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.011313234921545e-05, + "sensitivity": 0.8173159094697566 + }, + { + "name": "model.layers.6.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6362623581662774e-05, + "sensitivity": 0.9968345576375092 + }, + { + "name": "model.layers.6.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.013241318214568e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006609484553337097, + "sensitivity": 0.5586074782808822 + }, + { + "name": "model.layers.6.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.694651554222219e-05, + "sensitivity": 0.6020355788342076 + }, + { + "name": "model.layers.6.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.179500360303791e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007028586114756763, + "sensitivity": 0.5413638404227371 + }, + { + "name": "model.layers.6.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5556942243129015e-05, + "sensitivity": 0.820427356341269 + }, + { + "name": "model.layers.6.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.890008196729468e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006654657190665603, + "sensitivity": 0.5257731627154053 + }, + { + "name": "model.layers.6.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.626984057016671e-05, + "sensitivity": 0.8588157248540575 + }, + { + "name": "model.layers.6.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.207333171914797e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006917174905538559, + "sensitivity": 0.5284698706145263 + }, + { + "name": "model.layers.6.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.419144144980237e-05, + "sensitivity": 1.1337131833487177 + }, + { + "name": "model.layers.6.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.86152282266994e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006482896278612316, + "sensitivity": 0.5481658534158259 + }, + { + "name": "model.layers.6.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.694383798982017e-05, + "sensitivity": 0.6281391973043511 + }, + { + "name": "model.layers.6.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.640837343889871e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006447023479267955, + "sensitivity": 0.527591806791504 + }, + { + "name": "model.layers.6.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.457294173538685e-05, + "sensitivity": 0.7064950473669898 + }, + { + "name": "model.layers.6.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.727168854718911e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006333797937259078, + "sensitivity": 0.5364980987689366 + }, + { + "name": "model.layers.6.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0000441761803813e-05, + "sensitivity": 1.2751642967599524 + }, + { + "name": "model.layers.6.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.555439995281631e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.0630456017679535e-05, + "sensitivity": 1.2249667298009408 + }, + { + "name": "model.layers.6.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.912419146625325e-05, + "sensitivity": 1.0389221255457723 + }, + { + "name": "model.layers.6.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.088516215640993e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006984553183428943, + "sensitivity": 0.5285616740386496 + }, + { + "name": "model.layers.6.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006383167929016054, + "sensitivity": 0.5639585703445329 + }, + { + "name": "model.layers.6.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.091443651712325e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006784825818613172, + "sensitivity": 0.5501404759866451 + }, + { + "name": "model.layers.6.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.370170038077049e-05, + "sensitivity": 0.733994129798322 + }, + { + "name": "model.layers.6.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.828340476909943e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006538236048072577, + "sensitivity": 0.5431231251981703 + }, + { + "name": "model.layers.6.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0326089977752417e-05, + "sensitivity": 1.4977216942356018 + }, + { + "name": "model.layers.6.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.823808351124171e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006560046458616853, + "sensitivity": 0.5076706554567496 + }, + { + "name": "model.layers.6.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0339149058563635e-05, + "sensitivity": 0.7162884799869463 + }, + { + "name": "model.layers.6.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.269820005400106e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007013003341853619, + "sensitivity": 0.5178252041083931 + }, + { + "name": "model.layers.6.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006524806376546621, + "sensitivity": 0.5374168813636166 + }, + { + "name": "model.layers.6.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.919238788010261e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000682905490975827, + "sensitivity": 0.524269699434542 + }, + { + "name": "model.layers.6.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6832825066521764e-05, + "sensitivity": 0.9280927405690907 + }, + { + "name": "model.layers.6.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.225106972124195e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006909620715305209, + "sensitivity": 0.5305612992119594 + }, + { + "name": "model.layers.6.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3570511227007955e-05, + "sensitivity": 1.132196602487088 + }, + { + "name": "model.layers.6.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.716884174944425e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006345995934680104, + "sensitivity": 0.5375532804240135 + }, + { + "name": "model.layers.6.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0937159458990209e-05, + "sensitivity": 1.7507448239850112 + }, + { + "name": "model.layers.6.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.301999633251398e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007088084239512682, + "sensitivity": 0.5321531900838443 + }, + { + "name": "model.layers.6.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.553107621381059e-05, + "sensitivity": 0.7784711585086197 + }, + { + "name": "model.layers.6.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.178356670716312e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006693013710901141, + "sensitivity": 0.5228456258546624 + }, + { + "name": "model.layers.6.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.487708403961733e-05, + "sensitivity": 0.7568763462491285 + }, + { + "name": "model.layers.6.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.931458417762769e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006566282245330513, + "sensitivity": 0.5339737452275339 + }, + { + "name": "model.layers.6.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006470398511737585, + "sensitivity": 0.5578504382031609 + }, + { + "name": "model.layers.6.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.054380037312512e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006846371106803417, + "sensitivity": 0.5201100449394973 + }, + { + "name": "model.layers.6.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7614735851529986e-05, + "sensitivity": 0.9849311333229777 + }, + { + "name": "model.layers.6.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.306955810941872e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.031420343788341e-05, + "sensitivity": 0.623568544442872 + }, + { + "name": "model.layers.6.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.880229582544416e-05, + "sensitivity": 0.8209464388676091 + }, + { + "name": "model.layers.6.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.233018439161242e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007049901178106666, + "sensitivity": 0.5138082631252385 + }, + { + "name": "model.layers.6.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5708449508529156e-05, + "sensitivity": 0.8073737087595007 + }, + { + "name": "model.layers.6.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.222611546036205e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000673370435833931, + "sensitivity": 0.5701522969928297 + }, + { + "name": "model.layers.6.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.498591053765267e-05, + "sensitivity": 0.6405688580230897 + }, + { + "name": "model.layers.6.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.075684382267355e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006615861784666777, + "sensitivity": 0.5269150957024943 + }, + { + "name": "model.layers.6.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4644286137772724e-05, + "sensitivity": 0.9695087254359768 + }, + { + "name": "model.layers.6.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.750279115090962e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006405391031876206, + "sensitivity": 0.5251737866005454 + }, + { + "name": "model.layers.6.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.950443301117048e-05, + "sensitivity": 0.8385405137928128 + }, + { + "name": "model.layers.6.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.073083795854473e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006922497414052486, + "sensitivity": 0.5444900050838899 + }, + { + "name": "model.layers.6.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.785828034277074e-05, + "sensitivity": 1.055375458936517 + }, + { + "name": "model.layers.6.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.963331091152213e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006777415401302278, + "sensitivity": 0.5340883278341996 + }, + { + "name": "model.layers.6.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0380054492270574e-05, + "sensitivity": 1.0292258736710809 + }, + { + "name": "model.layers.6.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.362626550071582e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007096345070749521, + "sensitivity": 0.5143366618039594 + }, + { + "name": "model.layers.6.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.340871211956255e-05, + "sensitivity": 0.9863218151020383 + }, + { + "name": "model.layers.6.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.395532068381726e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6876531743910164e-05, + "sensitivity": 0.6060369892020345 + }, + { + "name": "model.layers.6.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006280107190832496, + "sensitivity": 0.5775759466860291 + }, + { + "name": "model.layers.6.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.714584858651506e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006474937545135617, + "sensitivity": 0.5319294029995575 + }, + { + "name": "model.layers.6.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006430996581912041, + "sensitivity": 0.5406266256930873 + }, + { + "name": "model.layers.6.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.015056328578794e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006772935157641768, + "sensitivity": 0.5877906475182323 + }, + { + "name": "model.layers.6.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.710066034225747e-05, + "sensitivity": 0.7471953289717292 + }, + { + "name": "model.layers.6.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.102657152950997e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000695804541464895, + "sensitivity": 0.5094190887003807 + }, + { + "name": "model.layers.6.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.48322859685868e-05, + "sensitivity": 0.6224332152129305 + }, + { + "name": "model.layers.6.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.083286621105799e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006729968590661883, + "sensitivity": 0.52705711665244 + }, + { + "name": "model.layers.6.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9344456531107426e-05, + "sensitivity": 0.8243890275146544 + }, + { + "name": "model.layers.6.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.108183470132644e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.217225745785981e-05, + "sensitivity": 0.7626473875928069 + }, + { + "name": "model.layers.6.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006600222550332546, + "sensitivity": 0.5869058986582536 + }, + { + "name": "model.layers.6.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.248729960134369e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007126370328478515, + "sensitivity": 0.5391390231611126 + }, + { + "name": "model.layers.6.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.878698620013893e-06, + "sensitivity": 1.4005742678135402 + }, + { + "name": "model.layers.6.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.750721356889699e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006429735803976655, + "sensitivity": 0.518499441667112 + }, + { + "name": "model.layers.6.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9441354096634313e-05, + "sensitivity": 0.9900358644197229 + }, + { + "name": "model.layers.6.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.228361826288165e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000695324910338968, + "sensitivity": 0.5535241560125183 + }, + { + "name": "model.layers.6.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.2797717216890305e-05, + "sensitivity": 0.7821601836766932 + }, + { + "name": "model.layers.6.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.645305805046519e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006292031612247229, + "sensitivity": 0.5317107109072646 + }, + { + "name": "model.layers.6.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.70462980249431e-05, + "sensitivity": 0.7843891851529493 + }, + { + "name": "model.layers.6.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.127181677584304e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.035942351445556e-05, + "sensitivity": 0.7552309681678469 + }, + { + "name": "model.layers.6.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.701258123735897e-05, + "sensitivity": 0.777322376773594 + }, + { + "name": "model.layers.6.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.342977485473966e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006784155848436058, + "sensitivity": 0.5453614732023868 + }, + { + "name": "model.layers.6.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.104051135480404e-05, + "sensitivity": 0.6552720376763157 + }, + { + "name": "model.layers.6.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.449205329772667e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007276737014763057, + "sensitivity": 0.5359690795662718 + }, + { + "name": "model.layers.6.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4772041039541364e-05, + "sensitivity": 0.7795287821969561 + }, + { + "name": "model.layers.6.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.916089094171184e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006677813362330198, + "sensitivity": 0.5100133354152152 + }, + { + "name": "model.layers.6.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006660979706794024, + "sensitivity": 0.5313935921410139 + }, + { + "name": "model.layers.6.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.150789886305574e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006914662080816925, + "sensitivity": 0.5266513399673843 + }, + { + "name": "model.layers.6.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.164110189070925e-05, + "sensitivity": 1.1958459195665665 + }, + { + "name": "model.layers.6.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.426354618975893e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.351617801352404e-05, + "sensitivity": 0.622156211956137 + }, + { + "name": "model.layers.6.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.663411502609961e-05, + "sensitivity": 0.7844660401844595 + }, + { + "name": "model.layers.6.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.103801410972665e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006890061195008457, + "sensitivity": 0.5180957369779712 + }, + { + "name": "model.layers.6.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.890367538086139e-05, + "sensitivity": 0.8524389334413824 + }, + { + "name": "model.layers.6.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.897919320181245e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.284908158704638e-05, + "sensitivity": 0.9959739133078523 + }, + { + "name": "model.layers.6.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8093206462217495e-05, + "sensitivity": 0.9243585035991819 + }, + { + "name": "model.layers.6.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.171907216412365e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006913856486789882, + "sensitivity": 0.5103035851714822 + }, + { + "name": "model.layers.6.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0311521691619419e-05, + "sensitivity": 1.314706545458852 + }, + { + "name": "model.layers.6.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.090200486141839e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9573583712335676e-05, + "sensitivity": 0.9498941371847344 + }, + { + "name": "model.layers.6.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006669365102425218, + "sensitivity": 0.5035688116671737 + }, + { + "name": "model.layers.6.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.172177791086142e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00070140918251127, + "sensitivity": 0.5065843335969656 + }, + { + "name": "model.layers.6.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.02882937528193e-05, + "sensitivity": 0.8835380925921081 + }, + { + "name": "model.layers.6.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.205243039403285e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007065918180160224, + "sensitivity": 0.5184654004137565 + }, + { + "name": "model.layers.6.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7779743656283244e-05, + "sensitivity": 0.9903254808522901 + }, + { + "name": "model.layers.6.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.340029585771845e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.092302646720782e-05, + "sensitivity": 0.6699571374582189 + }, + { + "name": "model.layers.6.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.622508979286067e-05, + "sensitivity": 0.9817457293655094 + }, + { + "name": "model.layers.6.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.984146239119582e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.988773045828566e-05, + "sensitivity": 0.8908818072382368 + }, + { + "name": "model.layers.6.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.633967521134764e-05, + "sensitivity": 0.6377902469572438 + }, + { + "name": "model.layers.6.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.733494958803931e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006563730421476066, + "sensitivity": 0.551345801704431 + }, + { + "name": "model.layers.6.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006390023627318442, + "sensitivity": 0.5212106278020271 + }, + { + "name": "model.layers.6.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.995547098791576e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006774008506909013, + "sensitivity": 0.5079884126487787 + }, + { + "name": "model.layers.6.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.43172427569516e-05, + "sensitivity": 1.182943807113232 + }, + { + "name": "model.layers.6.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.889531848879415e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006475000409409404, + "sensitivity": 0.5494417532154581 + }, + { + "name": "model.layers.6.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 9.630176464270335e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.964664534170879e-06, + "sensitivity": 2.099288426383133 + }, + { + "name": "model.layers.6.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.62519925703964e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.6.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.3236229960966739e-06, + "sensitivity": 2.10155937077606 + }, + { + "name": "model.layers.6.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 8.352782970177941e-06, + "sensitivity": 2.148186083435637 + }, + { + "name": "model.layers.6.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.0001912114821607247, + "sensitivity": 0.9471759698748046 + }, + { + "name": "model.layers.6.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.195357344840886e-05, + "sensitivity": 1.7497405766493983 + }, + { + "name": "model.layers.6.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0005293141584843397, + "sensitivity": 0.5548273876801484 + }, + { + "name": "model.layers.6.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003165740636177361, + "sensitivity": 0.7335503835102731 + }, + { + "name": "model.layers.7.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006285854615271091, + "sensitivity": 0.5310993728027205 + }, + { + "name": "model.layers.7.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.447576197388116e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006641258951276541, + "sensitivity": 0.5080962802791482 + }, + { + "name": "model.layers.7.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006640524370595813, + "sensitivity": 0.5782057171300815 + }, + { + "name": "model.layers.7.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.376430974341929e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006968459929339588, + "sensitivity": 0.5164425281865961 + }, + { + "name": "model.layers.7.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7069682952715084e-05, + "sensitivity": 0.8975566990839071 + }, + { + "name": "model.layers.7.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.024205158108089e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9771304222522303e-05, + "sensitivity": 0.8117419753727988 + }, + { + "name": "model.layers.7.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006029325304552913, + "sensitivity": 0.5764435035328658 + }, + { + "name": "model.layers.7.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.068990501262306e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006262838141992688, + "sensitivity": 0.5369736942721245 + }, + { + "name": "model.layers.7.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006223347736522555, + "sensitivity": 0.5499916206014084 + }, + { + "name": "model.layers.7.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.320382794910984e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006522891926579177, + "sensitivity": 0.5161741146764348 + }, + { + "name": "model.layers.7.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.621020682156086e-05, + "sensitivity": 0.6750991206741357 + }, + { + "name": "model.layers.7.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.090490387578029e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000662352133076638, + "sensitivity": 0.5616967397200032 + }, + { + "name": "model.layers.7.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0005698543973267078, + "sensitivity": 0.515806391900241 + }, + { + "name": "model.layers.7.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.74806222175539e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005827447166666389, + "sensitivity": 0.5205471550745862 + }, + { + "name": "model.layers.7.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006065201014280319, + "sensitivity": 0.5257249701852521 + }, + { + "name": "model.layers.7.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.425466381188016e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006201675860211253, + "sensitivity": 0.511119882041758 + }, + { + "name": "model.layers.7.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006469734362326562, + "sensitivity": 0.5593799943639299 + }, + { + "name": "model.layers.7.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.785537950941944e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.836343552800827e-05, + "sensitivity": 0.6318491492464338 + }, + { + "name": "model.layers.7.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.442996189231053e-05, + "sensitivity": 0.745233893538501 + }, + { + "name": "model.layers.7.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.126750460884068e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006572717684321105, + "sensitivity": 0.5149819813909353 + }, + { + "name": "model.layers.7.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3967873100191355e-05, + "sensitivity": 0.6156906464052111 + }, + { + "name": "model.layers.7.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.125473532847536e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000627335102763027, + "sensitivity": 0.535252967386026 + }, + { + "name": "model.layers.7.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.757100734626874e-05, + "sensitivity": 0.8761712667416477 + }, + { + "name": "model.layers.7.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.041139499757264e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.930274710408412e-05, + "sensitivity": 0.9952726601827502 + }, + { + "name": "model.layers.7.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.905101716052741e-05, + "sensitivity": 0.8879450170409352 + }, + { + "name": "model.layers.7.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.086734174459707e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000679867691360414, + "sensitivity": 0.5254144425744017 + }, + { + "name": "model.layers.7.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3572577598970383e-05, + "sensitivity": 0.9633124593086229 + }, + { + "name": "model.layers.7.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.097706659602409e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006082457257434726, + "sensitivity": 0.5193063007857501 + }, + { + "name": "model.layers.7.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006285907002165914, + "sensitivity": 0.5633618944599837 + }, + { + "name": "model.layers.7.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.27945212272607e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000658623524941504, + "sensitivity": 0.5184510081125105 + }, + { + "name": "model.layers.7.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.320418858900666e-05, + "sensitivity": 0.7741428341314598 + }, + { + "name": "model.layers.7.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.202477038641518e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006198523915372789, + "sensitivity": 0.5227557037997002 + }, + { + "name": "model.layers.7.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006607719697058201, + "sensitivity": 0.5452936589513004 + }, + { + "name": "model.layers.7.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.224267394827621e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000685474369674921, + "sensitivity": 0.5473994170091947 + }, + { + "name": "model.layers.7.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006232651649042964, + "sensitivity": 0.5216011769475168 + }, + { + "name": "model.layers.7.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.708109256374883e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006373918149620295, + "sensitivity": 0.5332486671927286 + }, + { + "name": "model.layers.7.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006178590701892972, + "sensitivity": 0.5356794477236101 + }, + { + "name": "model.layers.7.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.91638467994926e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006372565403580666, + "sensitivity": 0.5110441525481961 + }, + { + "name": "model.layers.7.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006563399801962078, + "sensitivity": 0.5305169593599866 + }, + { + "name": "model.layers.7.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.22909453795728e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006735686911270022, + "sensitivity": 0.5718369576604401 + }, + { + "name": "model.layers.7.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006305986316874623, + "sensitivity": 0.5407849120417311 + }, + { + "name": "model.layers.7.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.784040920138068e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006973372073844075, + "sensitivity": 0.536066120320605 + }, + { + "name": "model.layers.7.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.2947936637792736e-05, + "sensitivity": 0.7120341009212721 + }, + { + "name": "model.layers.7.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.748214562117937e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006042728200554848, + "sensitivity": 0.598791782775763 + }, + { + "name": "model.layers.7.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.00067484425380826, + "sensitivity": 0.5215289497863066 + }, + { + "name": "model.layers.7.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.100860900914995e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006893902900628746, + "sensitivity": 0.5142864567494745 + }, + { + "name": "model.layers.7.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0694492276525125e-05, + "sensitivity": 0.8798884148767407 + }, + { + "name": "model.layers.7.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.28857151241391e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006994563154876232, + "sensitivity": 0.5062024609965204 + }, + { + "name": "model.layers.7.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006136137526482344, + "sensitivity": 0.5250660870440428 + }, + { + "name": "model.layers.7.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.944368695054436e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006413794471882284, + "sensitivity": 0.532511765117314 + }, + { + "name": "model.layers.7.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006245156982913613, + "sensitivity": 0.5549763933628472 + }, + { + "name": "model.layers.7.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.02846114361455e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006381713901646435, + "sensitivity": 0.5765319853734985 + }, + { + "name": "model.layers.7.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006523056654259562, + "sensitivity": 0.5394926827956099 + }, + { + "name": "model.layers.7.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.022107186254289e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006677209166809916, + "sensitivity": 0.5081719791904447 + }, + { + "name": "model.layers.7.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.2672676247311756e-05, + "sensitivity": 0.7023803996417274 + }, + { + "name": "model.layers.7.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.966178378002951e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000613968470133841, + "sensitivity": 0.509538924474834 + }, + { + "name": "model.layers.7.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9514917666092515e-05, + "sensitivity": 0.9466116829131508 + }, + { + "name": "model.layers.7.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.922008424226078e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.293143087532371e-05, + "sensitivity": 0.9357820668990922 + }, + { + "name": "model.layers.7.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4547588661080226e-05, + "sensitivity": 0.6810597278357804 + }, + { + "name": "model.layers.7.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.753337291025673e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006251310696825385, + "sensitivity": 0.5427773139220692 + }, + { + "name": "model.layers.7.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006676516495645046, + "sensitivity": 0.5097786040760139 + }, + { + "name": "model.layers.7.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.105659622335224e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006871768273413181, + "sensitivity": 0.5393581981447233 + }, + { + "name": "model.layers.7.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006878719432279468, + "sensitivity": 0.5412768239939789 + }, + { + "name": "model.layers.7.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.376246233230631e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007092603482306004, + "sensitivity": 0.5460815960660529 + }, + { + "name": "model.layers.7.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006594952428713441, + "sensitivity": 0.5409136938806953 + }, + { + "name": "model.layers.7.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.183691994010587e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006779811228625476, + "sensitivity": 0.5394284544783012 + }, + { + "name": "model.layers.7.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006077652797102928, + "sensitivity": 0.5681887768135615 + }, + { + "name": "model.layers.7.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.937930609434261e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006304677808657289, + "sensitivity": 0.5626774963479028 + }, + { + "name": "model.layers.7.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000583465036470443, + "sensitivity": 0.5310164411986447 + }, + { + "name": "model.layers.7.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.941923291175044e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005987006006762385, + "sensitivity": 0.5157500709252083 + }, + { + "name": "model.layers.7.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006480964366346598, + "sensitivity": 0.5532745676280008 + }, + { + "name": "model.layers.7.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.923961907683406e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006657079793512821, + "sensitivity": 0.5043441267885894 + }, + { + "name": "model.layers.7.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0005948141915723681, + "sensitivity": 0.5343164205993178 + }, + { + "name": "model.layers.7.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.224989874681341e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006149043329060078, + "sensitivity": 0.5055429558804372 + }, + { + "name": "model.layers.7.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006247260607779026, + "sensitivity": 0.5251525898222954 + }, + { + "name": "model.layers.7.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.080761636440002e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006448737112805247, + "sensitivity": 0.5026840189912501 + }, + { + "name": "model.layers.7.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000691444322001189, + "sensitivity": 0.5196842547104007 + }, + { + "name": "model.layers.7.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.321248520180234e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007137682987377048, + "sensitivity": 0.5210010515283658 + }, + { + "name": "model.layers.7.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.530188718694262e-05, + "sensitivity": 0.9902766845988619 + }, + { + "name": "model.layers.7.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.122626245996798e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.0459024451847654e-05, + "sensitivity": 1.3938075003891899 + }, + { + "name": "model.layers.7.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.262839113129303e-05, + "sensitivity": 0.8447448845819387 + }, + { + "name": "model.layers.7.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.046453672250209e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7180150179192424e-05, + "sensitivity": 0.6123032511132258 + }, + { + "name": "model.layers.7.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.180983397527598e-06, + "sensitivity": 1.6384968360111527 + }, + { + "name": "model.layers.7.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.981732217856916e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 4.899902705801651e-05, + "sensitivity": 0.6367923889416511 + }, + { + "name": "model.layers.7.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0005781640065833926, + "sensitivity": 0.5694742991825216 + }, + { + "name": "model.layers.7.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.534957037729328e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006030923686921597, + "sensitivity": 0.543575286001677 + }, + { + "name": "model.layers.7.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006182952784001827, + "sensitivity": 0.5119318748700965 + }, + { + "name": "model.layers.7.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.175154680931882e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006352817872539163, + "sensitivity": 0.5053912596767034 + }, + { + "name": "model.layers.7.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006501011084765196, + "sensitivity": 0.5807559347150961 + }, + { + "name": "model.layers.7.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.200350526341936e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006893409881740808, + "sensitivity": 0.547014743154823 + }, + { + "name": "model.layers.7.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.223013770068064e-05, + "sensitivity": 0.7655969219435699 + }, + { + "name": "model.layers.7.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.577503768312454e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.473549001384526e-05, + "sensitivity": 0.7149468640836616 + }, + { + "name": "model.layers.7.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006258563371375203, + "sensitivity": 0.5614970477110153 + }, + { + "name": "model.layers.7.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.327466053335229e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006608895491808653, + "sensitivity": 0.5059851314193357 + }, + { + "name": "model.layers.7.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 4.9284688429906964e-05, + "sensitivity": 0.6242470071276273 + }, + { + "name": "model.layers.7.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.758804491051706e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005810059374198318, + "sensitivity": 0.5304641882622053 + }, + { + "name": "model.layers.7.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006409158231690526, + "sensitivity": 0.52007242752223 + }, + { + "name": "model.layers.7.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.767709012616251e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006499758455902338, + "sensitivity": 0.5470332531456726 + }, + { + "name": "model.layers.7.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006489385850727558, + "sensitivity": 0.5341065266454442 + }, + { + "name": "model.layers.7.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.824073241456063e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006563173374161124, + "sensitivity": 0.5184510587649622 + }, + { + "name": "model.layers.7.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0005940558621659875, + "sensitivity": 0.564641868464315 + }, + { + "name": "model.layers.7.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.878320052943309e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006118664750829339, + "sensitivity": 0.516188361481141 + }, + { + "name": "model.layers.7.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.670772952726111e-05, + "sensitivity": 0.8239068891397434 + }, + { + "name": "model.layers.7.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.631792868778575e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.916252848692238e-05, + "sensitivity": 0.8230172959609515 + }, + { + "name": "model.layers.7.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.515339944395237e-05, + "sensitivity": 0.7256142963450841 + }, + { + "name": "model.layers.7.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.010852189319849e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006432951777242124, + "sensitivity": 0.5719986801814403 + }, + { + "name": "model.layers.7.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.807237175758928e-05, + "sensitivity": 0.9559897274926421 + }, + { + "name": "model.layers.7.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.611430194425338e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.170984852360561e-05, + "sensitivity": 0.6882206994915674 + }, + { + "name": "model.layers.7.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006209976854734123, + "sensitivity": 0.5993704581952555 + }, + { + "name": "model.layers.7.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.899096322536934e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006341019761748612, + "sensitivity": 0.5154432044515128 + }, + { + "name": "model.layers.7.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.334527668310329e-05, + "sensitivity": 0.9363057021416219 + }, + { + "name": "model.layers.7.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.149631417429191e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006283801048994064, + "sensitivity": 0.5856551437308297 + }, + { + "name": "model.layers.7.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006587802199646831, + "sensitivity": 0.5210429953967187 + }, + { + "name": "model.layers.7.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.843808139616158e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006650366703979671, + "sensitivity": 0.5137982146963058 + }, + { + "name": "model.layers.7.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.1963605073979124e-05, + "sensitivity": 0.7718800756993212 + }, + { + "name": "model.layers.7.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.133323608992214e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006031547673046589, + "sensitivity": 0.5286565722351834 + }, + { + "name": "model.layers.7.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006020166911184788, + "sensitivity": 0.533673197915718 + }, + { + "name": "model.layers.7.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.058327812752395e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006213050801306963, + "sensitivity": 0.5524937455667661 + }, + { + "name": "model.layers.7.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0005951565690338612, + "sensitivity": 0.5416044331236166 + }, + { + "name": "model.layers.7.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.130318297437043e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006094466662034392, + "sensitivity": 0.5632248810922657 + }, + { + "name": "model.layers.7.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006791501073166728, + "sensitivity": 0.5309201144935458 + }, + { + "name": "model.layers.7.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.384852895280346e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007062609656713903, + "sensitivity": 0.5333888521610165 + }, + { + "name": "model.layers.7.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006312994519248605, + "sensitivity": 0.5260884489707879 + }, + { + "name": "model.layers.7.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.266782293096185e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006621097563765943, + "sensitivity": 0.532186872122935 + }, + { + "name": "model.layers.7.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.972676783334464e-05, + "sensitivity": 0.8137120805645387 + }, + { + "name": "model.layers.7.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.707723739258654e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.391469262074679e-05, + "sensitivity": 0.6769786451837005 + }, + { + "name": "model.layers.7.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.745067755924538e-05, + "sensitivity": 0.6389059848053901 + }, + { + "name": "model.layers.7.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.976704642307595e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006662673549726605, + "sensitivity": 0.5775857846877668 + }, + { + "name": "model.layers.7.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 7.649958206457086e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.6349338238796918e-06, + "sensitivity": 2.0986139397860346 + }, + { + "name": "model.layers.7.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5512343907175818e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.7.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.3129277931511751e-06, + "sensitivity": 2.102411012204769 + }, + { + "name": "model.layers.7.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 6.294727882050211e-06, + "sensitivity": 2.1673653507053268 + }, + { + "name": "model.layers.7.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00017241756722796708, + "sensitivity": 0.9429004640685459 + }, + { + "name": "model.layers.7.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.210101709148148e-05, + "sensitivity": 1.681226268566732 + }, + { + "name": "model.layers.7.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.466004222398624e-05, + "sensitivity": 0.8648010873352465 + }, + { + "name": "model.layers.7.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002621706807985902, + "sensitivity": 0.7031955177702383 + }, + { + "name": "model.layers.8.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.2615861932281405e-05, + "sensitivity": 1.0870864895074375 + }, + { + "name": "model.layers.8.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.71673126614769e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006042394088581204, + "sensitivity": 0.5354667329338789 + }, + { + "name": "model.layers.8.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8776262449100614e-05, + "sensitivity": 1.1208821085470697 + }, + { + "name": "model.layers.8.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.192186674525146e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006728253792971373, + "sensitivity": 0.5221069142246312 + }, + { + "name": "model.layers.8.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.698503809981048e-05, + "sensitivity": 1.0001111275081294 + }, + { + "name": "model.layers.8.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.974013674858725e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006704336847178638, + "sensitivity": 0.537348433212655 + }, + { + "name": "model.layers.8.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5173917644424364e-05, + "sensitivity": 1.1093296374998443 + }, + { + "name": "model.layers.8.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.176166493787605e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8998397435061634e-05, + "sensitivity": 1.14767346226784 + }, + { + "name": "model.layers.8.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.240125392447226e-05, + "sensitivity": 1.0518087570225123 + }, + { + "name": "model.layers.8.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.312615141723654e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006098603480495512, + "sensitivity": 0.5841426661691032 + }, + { + "name": "model.layers.8.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.773860539193265e-05, + "sensitivity": 1.1803098653343007 + }, + { + "name": "model.layers.8.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.130306928753271e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006631077267229557, + "sensitivity": 0.5281308868041266 + }, + { + "name": "model.layers.8.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006219181232154369, + "sensitivity": 0.5448575134703897 + }, + { + "name": "model.layers.8.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.065719730941055e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006442638114094734, + "sensitivity": 0.5163258204083999 + }, + { + "name": "model.layers.8.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006509541999548674, + "sensitivity": 0.5348275117185777 + }, + { + "name": "model.layers.8.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.091271416153177e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006741936085745692, + "sensitivity": 0.553265314663232 + }, + { + "name": "model.layers.8.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.2279477889242116e-06, + "sensitivity": 2.0936203262295447 + }, + { + "name": "model.layers.8.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.948573971181759e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006497274152934551, + "sensitivity": 0.5442129085270528 + }, + { + "name": "model.layers.8.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.729049735236913e-05, + "sensitivity": 0.6627473443456809 + }, + { + "name": "model.layers.8.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.427906100725522e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006833620718680322, + "sensitivity": 0.5153162217033116 + }, + { + "name": "model.layers.8.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3337029385147616e-05, + "sensitivity": 1.1944379680014738 + }, + { + "name": "model.layers.8.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.457540055431309e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000617503363173455, + "sensitivity": 0.5215921319261468 + }, + { + "name": "model.layers.8.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006874331156723201, + "sensitivity": 0.547134638676166 + }, + { + "name": "model.layers.8.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.31044827059668e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007019065087661147, + "sensitivity": 0.5407603430707841 + }, + { + "name": "model.layers.8.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007055179448798299, + "sensitivity": 0.509056930905724 + }, + { + "name": "model.layers.8.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.370489700202597e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007130267913453281, + "sensitivity": 0.5299646684344438 + }, + { + "name": "model.layers.8.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.760023486800492e-05, + "sensitivity": 0.7655253291219766 + }, + { + "name": "model.layers.8.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.333998499030713e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006734055350534618, + "sensitivity": 0.5313576787216745 + }, + { + "name": "model.layers.8.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.859709199285135e-05, + "sensitivity": 0.6564524297873104 + }, + { + "name": "model.layers.8.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.192334467414184e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006772982887923717, + "sensitivity": 0.5499775389976215 + }, + { + "name": "model.layers.8.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.165255035739392e-05, + "sensitivity": 0.6146048110680012 + }, + { + "name": "model.layers.8.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.317042107184534e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007042891811579466, + "sensitivity": 0.5256339487359742 + }, + { + "name": "model.layers.8.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4848482250235975e-05, + "sensitivity": 0.8404102707559693 + }, + { + "name": "model.layers.8.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.936523734817456e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006279231747612357, + "sensitivity": 0.5531278251441654 + }, + { + "name": "model.layers.8.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006110720569267869, + "sensitivity": 0.552693974372499 + }, + { + "name": "model.layers.8.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.758219003837439e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006288491422310472, + "sensitivity": 0.5307159805522311 + }, + { + "name": "model.layers.8.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.245471119356807e-06, + "sensitivity": 1.6728180954190464 + }, + { + "name": "model.layers.8.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.183159714761132e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005736150778830051, + "sensitivity": 0.5123850143719645 + }, + { + "name": "model.layers.8.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4242682381300256e-05, + "sensitivity": 0.7190858800906638 + }, + { + "name": "model.layers.8.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.312208711278799e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000634278345387429, + "sensitivity": 0.5346459488169297 + }, + { + "name": "model.layers.8.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.162719753570855e-05, + "sensitivity": 0.8321288206884722 + }, + { + "name": "model.layers.8.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.777491765002196e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006078301230445504, + "sensitivity": 0.5107739932094367 + }, + { + "name": "model.layers.8.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.4775441539241e-06, + "sensitivity": 1.2515247870830233 + }, + { + "name": "model.layers.8.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.796049435957684e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005979108391329646, + "sensitivity": 0.5518671864699555 + }, + { + "name": "model.layers.8.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.914230132475495e-05, + "sensitivity": 0.6897979349771116 + }, + { + "name": "model.layers.8.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.262265515033505e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006954871350899339, + "sensitivity": 0.5276448124586104 + }, + { + "name": "model.layers.8.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0355888662161306e-05, + "sensitivity": 1.573219285400514 + }, + { + "name": "model.layers.8.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.686907679271826e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.097659934312105e-05, + "sensitivity": 0.8977643342601819 + }, + { + "name": "model.layers.8.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.843246981385164e-05, + "sensitivity": 0.7647439647580461 + }, + { + "name": "model.layers.8.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.194605361997674e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006755664362572134, + "sensitivity": 0.5012576828982775 + }, + { + "name": "model.layers.8.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006658685160800815, + "sensitivity": 0.5599304851481322 + }, + { + "name": "model.layers.8.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.972873395876377e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006737681105732918, + "sensitivity": 0.5411090158500438 + }, + { + "name": "model.layers.8.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.498531390912831e-05, + "sensitivity": 0.727280634469451 + }, + { + "name": "model.layers.8.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.195393211783085e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006391379865817726, + "sensitivity": 0.5202342725427327 + }, + { + "name": "model.layers.8.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0801223652379122e-05, + "sensitivity": 1.6465826212871875 + }, + { + "name": "model.layers.8.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.28692987447721e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006823057774454355, + "sensitivity": 0.5502517326140575 + }, + { + "name": "model.layers.8.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.072902422398329e-05, + "sensitivity": 0.7868710018713755 + }, + { + "name": "model.layers.8.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.603196993637539e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.318496187101118e-05, + "sensitivity": 0.831806749699856 + }, + { + "name": "model.layers.8.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9270067140460014e-05, + "sensitivity": 0.9470221606314492 + }, + { + "name": "model.layers.8.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.432395250361878e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.219906936166808e-05, + "sensitivity": 0.8204530712264315 + }, + { + "name": "model.layers.8.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006307018920779228, + "sensitivity": 0.5663031113229271 + }, + { + "name": "model.layers.8.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.742139705944282e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006404279265552759, + "sensitivity": 0.5307843520907931 + }, + { + "name": "model.layers.8.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.58365645701997e-05, + "sensitivity": 1.1183224216942202 + }, + { + "name": "model.layers.8.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.070342806197004e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.798276833957061e-05, + "sensitivity": 0.8440855514090759 + }, + { + "name": "model.layers.8.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0085102985613048e-05, + "sensitivity": 1.2701799638893685 + }, + { + "name": "model.layers.8.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.140813522710232e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7542521972209215e-05, + "sensitivity": 0.7488112866076663 + }, + { + "name": "model.layers.8.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006910294177941978, + "sensitivity": 0.559079180395661 + }, + { + "name": "model.layers.8.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.15346266386041e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006978041492402554, + "sensitivity": 0.5307955675491723 + }, + { + "name": "model.layers.8.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.559723649639636e-05, + "sensitivity": 1.0546937672746093 + }, + { + "name": "model.layers.8.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.614859557885211e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.779845378128812e-05, + "sensitivity": 0.89047466188325 + }, + { + "name": "model.layers.8.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.977266118861735e-05, + "sensitivity": 1.0050705665239508 + }, + { + "name": "model.layers.8.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.437505248868547e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006848713383078575, + "sensitivity": 0.5740453052245409 + }, + { + "name": "model.layers.8.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.326051905285567e-05, + "sensitivity": 0.7484268151532476 + }, + { + "name": "model.layers.8.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.179761840030551e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006288717268034816, + "sensitivity": 0.5527154260571621 + }, + { + "name": "model.layers.8.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8454064856050536e-05, + "sensitivity": 0.7150786705779367 + }, + { + "name": "model.layers.8.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.407811952158227e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000684408179949969, + "sensitivity": 0.5188308214639701 + }, + { + "name": "model.layers.8.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.666171637130901e-05, + "sensitivity": 0.8822320043884101 + }, + { + "name": "model.layers.8.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.788373869108909e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006405941094271839, + "sensitivity": 0.5391685193444248 + }, + { + "name": "model.layers.8.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006878252024762332, + "sensitivity": 0.5173512870683591 + }, + { + "name": "model.layers.8.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.281061928348208e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000707612547557801, + "sensitivity": 0.5104118713880513 + }, + { + "name": "model.layers.8.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000649136258289218, + "sensitivity": 0.5583637286815685 + }, + { + "name": "model.layers.8.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.365065701174899e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006790678016841412, + "sensitivity": 0.5398701870808521 + }, + { + "name": "model.layers.8.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9970432630507275e-05, + "sensitivity": 0.9824354208034521 + }, + { + "name": "model.layers.8.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.219751753633318e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006898745778016746, + "sensitivity": 0.5412851817838814 + }, + { + "name": "model.layers.8.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6241173297166824e-05, + "sensitivity": 0.7749969915339826 + }, + { + "name": "model.layers.8.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.167048240968143e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006554393912665546, + "sensitivity": 0.5367211935859852 + }, + { + "name": "model.layers.8.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006598454201593995, + "sensitivity": 0.5767583721453159 + }, + { + "name": "model.layers.8.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.24120730208233e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006748183513991535, + "sensitivity": 0.5080155172363683 + }, + { + "name": "model.layers.8.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.905385478399694e-05, + "sensitivity": 0.665856271178344 + }, + { + "name": "model.layers.8.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.957725761618349e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006658464553765953, + "sensitivity": 0.5192218125290777 + }, + { + "name": "model.layers.8.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.040451262379065e-05, + "sensitivity": 0.6523308956975519 + }, + { + "name": "model.layers.8.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.145505722088274e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006948718801140785, + "sensitivity": 0.5360621632377598 + }, + { + "name": "model.layers.8.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.825726839248091e-05, + "sensitivity": 0.6912991033709895 + }, + { + "name": "model.layers.8.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.398983600774955e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006741941324435174, + "sensitivity": 0.539443096116127 + }, + { + "name": "model.layers.8.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.959940608590841e-05, + "sensitivity": 0.7522959247385123 + }, + { + "name": "model.layers.8.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.98943188379053e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006651740404777229, + "sensitivity": 0.5473037128540261 + }, + { + "name": "model.layers.8.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.221517105586827e-05, + "sensitivity": 0.724214950955535 + }, + { + "name": "model.layers.8.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.525741582663613e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007223885040730238, + "sensitivity": 0.5175606066423489 + }, + { + "name": "model.layers.8.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7800934882834554e-05, + "sensitivity": 0.6747299438475869 + }, + { + "name": "model.layers.8.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.372994221237605e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006738868542015553, + "sensitivity": 0.5933618750715148 + }, + { + "name": "model.layers.8.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3238123655319214e-05, + "sensitivity": 0.9228794044449415 + }, + { + "name": "model.layers.8.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.044552947059856e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006113721756264567, + "sensitivity": 0.5482854844516507 + }, + { + "name": "model.layers.8.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5096112191677094e-05, + "sensitivity": 0.700575386381613 + }, + { + "name": "model.layers.8.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.176052238515695e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006509938393719494, + "sensitivity": 0.5001505586290487 + }, + { + "name": "model.layers.8.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0683223081286997e-05, + "sensitivity": 1.3304451987384829 + }, + { + "name": "model.layers.8.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.227409130588057e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006682439125142992, + "sensitivity": 0.5624404181209963 + }, + { + "name": "model.layers.8.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.847525244462304e-05, + "sensitivity": 1.0719372323265646 + }, + { + "name": "model.layers.8.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.076325576032104e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006915838457643986, + "sensitivity": 0.5337965375288557 + }, + { + "name": "model.layers.8.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8641715440899134e-05, + "sensitivity": 1.0080218464167219 + }, + { + "name": "model.layers.8.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.538168915743881e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.243996904231608e-05, + "sensitivity": 0.6987809043628073 + }, + { + "name": "model.layers.8.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0298905181116425e-05, + "sensitivity": 1.2494091619061605 + }, + { + "name": "model.layers.8.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.099608640397491e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6786928325891495e-05, + "sensitivity": 0.8416143552074654 + }, + { + "name": "model.layers.8.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.216136923991144e-05, + "sensitivity": 1.129060987784554 + }, + { + "name": "model.layers.8.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.794286153104622e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006110165268182755, + "sensitivity": 0.5246742407732686 + }, + { + "name": "model.layers.8.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.284371193032712e-05, + "sensitivity": 0.6055920122782452 + }, + { + "name": "model.layers.8.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.036767328827409e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007521145744249225, + "sensitivity": 0.5364995650687856 + }, + { + "name": "model.layers.8.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.813846190809272e-06, + "sensitivity": 1.457729745170581 + }, + { + "name": "model.layers.8.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.755064194090664e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006191876600496471, + "sensitivity": 0.5189783919067208 + }, + { + "name": "model.layers.8.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.909351319947746e-06, + "sensitivity": 1.2338806769986068 + }, + { + "name": "model.layers.8.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.788973567177891e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006186409736983478, + "sensitivity": 0.5417981469866897 + }, + { + "name": "model.layers.8.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.886091821594164e-05, + "sensitivity": 0.8216119413689545 + }, + { + "name": "model.layers.8.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.148775580390065e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000699042109772563, + "sensitivity": 0.5630105440949598 + }, + { + "name": "model.layers.8.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.478312596096657e-05, + "sensitivity": 0.7738089896257592 + }, + { + "name": "model.layers.8.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.509608283522539e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006335486541502178, + "sensitivity": 0.5344884353592708 + }, + { + "name": "model.layers.8.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006579881301149726, + "sensitivity": 0.5651262904664438 + }, + { + "name": "model.layers.8.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.255388029785536e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006850508507341146, + "sensitivity": 0.4983450460040795 + }, + { + "name": "model.layers.8.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.771047653979622e-05, + "sensitivity": 0.707014603468375 + }, + { + "name": "model.layers.8.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.274342467804672e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00067514757392928, + "sensitivity": 0.5853513044069409 + }, + { + "name": "model.layers.8.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 7.128865490813041e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.9909907678083982e-06, + "sensitivity": 2.0992466545881228 + }, + { + "name": "model.layers.8.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.088238832380739e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.8.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.2747664186463226e-06, + "sensitivity": 2.103351951268362 + }, + { + "name": "model.layers.8.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 5.40961445949506e-06, + "sensitivity": 2.1476848864125913 + }, + { + "name": "model.layers.8.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00016921942005865276, + "sensitivity": 1.1521923221834178 + }, + { + "name": "model.layers.8.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 5, + "mse": 3.2878731417440576e-06, + "sensitivity": 2.000065486914284 + }, + { + "name": "model.layers.8.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 3.61978163709864e-05, + "sensitivity": 0.6878365858430043 + }, + { + "name": "model.layers.8.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 4, + "mse": 5.29955759702716e-05, + "sensitivity": 1.2480728559870202 + }, + { + "name": "model.layers.9.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006718370132148266, + "sensitivity": 0.5974981442462561 + }, + { + "name": "model.layers.9.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.780824151064735e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007002022466622293, + "sensitivity": 0.5281827566171818 + }, + { + "name": "model.layers.9.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.816221528220922e-05, + "sensitivity": 0.7601869078307271 + }, + { + "name": "model.layers.9.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.991096827528963e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006589662516489625, + "sensitivity": 0.499096140686669 + }, + { + "name": "model.layers.9.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0736645536962897e-05, + "sensitivity": 0.7739035022086147 + }, + { + "name": "model.layers.9.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.385912456607912e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006955966237001121, + "sensitivity": 0.5225135115829536 + }, + { + "name": "model.layers.9.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5396863899659365e-05, + "sensitivity": 0.6349225692132343 + }, + { + "name": "model.layers.9.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.902896873521968e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006477205315604806, + "sensitivity": 0.5493347837636049 + }, + { + "name": "model.layers.9.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000625104526989162, + "sensitivity": 0.5156217196632166 + }, + { + "name": "model.layers.9.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.997364951326745e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000633592251688242, + "sensitivity": 0.5147526078118756 + }, + { + "name": "model.layers.9.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006583509966731071, + "sensitivity": 0.5401188815949858 + }, + { + "name": "model.layers.9.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.32187493465608e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000667195999994874, + "sensitivity": 0.5483101137017716 + }, + { + "name": "model.layers.9.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.472133489092812e-05, + "sensitivity": 0.7656930838232505 + }, + { + "name": "model.layers.9.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.747360205532459e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006091412506066263, + "sensitivity": 0.5245120710668897 + }, + { + "name": "model.layers.9.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006541299517266452, + "sensitivity": 0.543969560658333 + }, + { + "name": "model.layers.9.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.945041152699559e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006554305437020957, + "sensitivity": 0.510493402187641 + }, + { + "name": "model.layers.9.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0735583247151226e-05, + "sensitivity": 0.812920110599862 + }, + { + "name": "model.layers.9.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.248469842124905e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007019077311269939, + "sensitivity": 0.5184826878285639 + }, + { + "name": "model.layers.9.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.45048130536452e-05, + "sensitivity": 0.777808666053188 + }, + { + "name": "model.layers.9.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.927607500983868e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.561432383023202e-05, + "sensitivity": 0.625946443004278 + }, + { + "name": "model.layers.9.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.737854735343717e-05, + "sensitivity": 1.0055944339674798 + }, + { + "name": "model.layers.9.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.035924116076785e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006520358147099614, + "sensitivity": 0.5394258112258008 + }, + { + "name": "model.layers.9.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.815062831970863e-05, + "sensitivity": 0.7639784608296054 + }, + { + "name": "model.layers.9.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.213836059032474e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006421709549613297, + "sensitivity": 0.5363253830341523 + }, + { + "name": "model.layers.9.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 4.933826858177781e-05, + "sensitivity": 1.1897185294931552 + }, + { + "name": "model.layers.9.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.20947651239112e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005555971874855459, + "sensitivity": 0.5312537666110428 + }, + { + "name": "model.layers.9.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.498290920513682e-05, + "sensitivity": 0.8193481454629192 + }, + { + "name": "model.layers.9.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.786170618193864e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006118487799540162, + "sensitivity": 0.5405327490428831 + }, + { + "name": "model.layers.9.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 4.735418769996613e-05, + "sensitivity": 1.1345636038083384 + }, + { + "name": "model.layers.9.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.159403144716634e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 4.857263411395252e-05, + "sensitivity": 0.6716076076525119 + }, + { + "name": "model.layers.9.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.758404950029217e-05, + "sensitivity": 0.6642522631264085 + }, + { + "name": "model.layers.9.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.724800982738088e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006464474718086421, + "sensitivity": 0.5102632889321557 + }, + { + "name": "model.layers.9.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006569531979039311, + "sensitivity": 0.5450408697676192 + }, + { + "name": "model.layers.9.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.108036814111983e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006626536487601697, + "sensitivity": 0.5272941325335221 + }, + { + "name": "model.layers.9.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006700510857626796, + "sensitivity": 0.5370812749656019 + }, + { + "name": "model.layers.9.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.857401106368343e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006672595627605915, + "sensitivity": 0.5508096439260771 + }, + { + "name": "model.layers.9.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006799123948439956, + "sensitivity": 0.5237648296316144 + }, + { + "name": "model.layers.9.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.489742077064875e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006957825971767306, + "sensitivity": 0.5163109781645167 + }, + { + "name": "model.layers.9.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006354896468110383, + "sensitivity": 0.5600641966688469 + }, + { + "name": "model.layers.9.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.825729658681666e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006412089569494128, + "sensitivity": 0.5377155656907076 + }, + { + "name": "model.layers.9.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006639836356043816, + "sensitivity": 0.5385051073340629 + }, + { + "name": "model.layers.9.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.62295406073099e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006761080003343523, + "sensitivity": 0.5982812623247226 + }, + { + "name": "model.layers.9.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006710347952321172, + "sensitivity": 0.5728549837555827 + }, + { + "name": "model.layers.9.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.072683618185692e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006706896238029003, + "sensitivity": 0.5171149340226308 + }, + { + "name": "model.layers.9.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5865726608317345e-05, + "sensitivity": 0.7072570216286294 + }, + { + "name": "model.layers.9.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.863196292921202e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006323631387203932, + "sensitivity": 0.5797507117229485 + }, + { + "name": "model.layers.9.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006678564241155982, + "sensitivity": 0.5271455393129687 + }, + { + "name": "model.layers.9.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.085470545258431e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006675521726720035, + "sensitivity": 0.5303883057855083 + }, + { + "name": "model.layers.9.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6991899327840656e-05, + "sensitivity": 0.7601300056525367 + }, + { + "name": "model.layers.9.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.031857537891483e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000633547839242965, + "sensitivity": 0.516982962070228 + }, + { + "name": "model.layers.9.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007340325973927975, + "sensitivity": 0.5340304243476248 + }, + { + "name": "model.layers.9.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.962081897654571e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007695964886806905, + "sensitivity": 0.5078994421381209 + }, + { + "name": "model.layers.9.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006550386315211654, + "sensitivity": 0.5377154142950005 + }, + { + "name": "model.layers.9.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.90579134041036e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006528531666845083, + "sensitivity": 0.5348849826268476 + }, + { + "name": "model.layers.9.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.609393701888621e-05, + "sensitivity": 0.8753976464267876 + }, + { + "name": "model.layers.9.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.9379186723163e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006335391663014889, + "sensitivity": 0.5351213469846751 + }, + { + "name": "model.layers.9.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 2.1756079149781726e-05, + "sensitivity": 0.7833321942620575 + }, + { + "name": "model.layers.9.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3853144764652825e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.547999070491642e-05, + "sensitivity": 1.164623300766112 + }, + { + "name": "model.layers.9.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006561711197718978, + "sensitivity": 0.5272391993808697 + }, + { + "name": "model.layers.9.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.782071070825623e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006604896625503898, + "sensitivity": 0.5111338067878537 + }, + { + "name": "model.layers.9.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.315493035595864e-05, + "sensitivity": 1.0839796478668062 + }, + { + "name": "model.layers.9.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.819899110472761e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.337941911420785e-05, + "sensitivity": 1.1770380792568778 + }, + { + "name": "model.layers.9.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006664553075097501, + "sensitivity": 0.5148726810422262 + }, + { + "name": "model.layers.9.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.161633336887462e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006714666960760951, + "sensitivity": 0.5216714025316695 + }, + { + "name": "model.layers.9.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006479392177425325, + "sensitivity": 0.537111416048353 + }, + { + "name": "model.layers.9.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.897651931263681e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006447885534726083, + "sensitivity": 0.5256907768048952 + }, + { + "name": "model.layers.9.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006379467085935175, + "sensitivity": 0.5606197894323284 + }, + { + "name": "model.layers.9.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.898794483982783e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006464140024036169, + "sensitivity": 0.5160448963100829 + }, + { + "name": "model.layers.9.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.646627687383443e-05, + "sensitivity": 0.6637862779981396 + }, + { + "name": "model.layers.9.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.753242930950364e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006488097715191543, + "sensitivity": 0.5461852006546448 + }, + { + "name": "model.layers.9.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006542066112160683, + "sensitivity": 0.5028268773492732 + }, + { + "name": "model.layers.9.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.983508799545234e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006546530639752746, + "sensitivity": 0.5581315928798517 + }, + { + "name": "model.layers.9.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006636198377236724, + "sensitivity": 0.5288522595631724 + }, + { + "name": "model.layers.9.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.312394589258474e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006760554388165474, + "sensitivity": 0.5178451099215056 + }, + { + "name": "model.layers.9.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.771277938038111e-05, + "sensitivity": 0.6898596164861763 + }, + { + "name": "model.layers.9.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.965943614683056e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.920344119658694e-05, + "sensitivity": 0.6533553946745849 + }, + { + "name": "model.layers.9.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.702349517378025e-05, + "sensitivity": 0.6052258298862636 + }, + { + "name": "model.layers.9.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.109018724804628e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8049423387274146e-05, + "sensitivity": 0.9419921651697312 + }, + { + "name": "model.layers.9.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006789787439629436, + "sensitivity": 0.5596831470364378 + }, + { + "name": "model.layers.9.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.626685262745013e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006933552213013172, + "sensitivity": 0.5106485043591351 + }, + { + "name": "model.layers.9.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006471562664955854, + "sensitivity": 0.5271988432308534 + }, + { + "name": "model.layers.9.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.836033665218565e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006467056809924543, + "sensitivity": 0.5388931905143126 + }, + { + "name": "model.layers.9.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.2778708525002e-05, + "sensitivity": 0.6412159793331497 + }, + { + "name": "model.layers.9.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.471129836427281e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007179678650572896, + "sensitivity": 0.5418410978722 + }, + { + "name": "model.layers.9.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006732097244821489, + "sensitivity": 0.5330232195046056 + }, + { + "name": "model.layers.9.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.288195208981051e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006925577181391418, + "sensitivity": 0.5684843701598621 + }, + { + "name": "model.layers.9.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006922517786733806, + "sensitivity": 0.5101539018407268 + }, + { + "name": "model.layers.9.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.402889312084881e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007053522276692092, + "sensitivity": 0.5321877842075657 + }, + { + "name": "model.layers.9.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.682798655470833e-05, + "sensitivity": 0.8269258308350649 + }, + { + "name": "model.layers.9.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.737448868283536e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.802429950563237e-05, + "sensitivity": 1.0409294934526672 + }, + { + "name": "model.layers.9.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006695526535622776, + "sensitivity": 0.5547868347230887 + }, + { + "name": "model.layers.9.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.325420827124617e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006943633197806776, + "sensitivity": 0.5317543840998671 + }, + { + "name": "model.layers.9.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006354432553052902, + "sensitivity": 0.5467838656682416 + }, + { + "name": "model.layers.9.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.151075808702444e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006448048516176641, + "sensitivity": 0.5313684322241787 + }, + { + "name": "model.layers.9.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006414763629436493, + "sensitivity": 0.5388303555934773 + }, + { + "name": "model.layers.9.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.005046770951594e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006460507865995169, + "sensitivity": 0.5621515408507196 + }, + { + "name": "model.layers.9.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7949666370404884e-05, + "sensitivity": 0.7544313210468162 + }, + { + "name": "model.layers.9.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.707196919502167e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006404236773960292, + "sensitivity": 0.5420474606013896 + }, + { + "name": "model.layers.9.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5711978347972035e-05, + "sensitivity": 0.6038881845328038 + }, + { + "name": "model.layers.9.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.876138402527431e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006185109377838671, + "sensitivity": 0.532222388737757 + }, + { + "name": "model.layers.9.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.69464718864765e-05, + "sensitivity": 0.8191484681077827 + }, + { + "name": "model.layers.9.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.550317491222813e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006967487279325724, + "sensitivity": 0.5135653990615187 + }, + { + "name": "model.layers.9.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006351706106215715, + "sensitivity": 0.5818689608162618 + }, + { + "name": "model.layers.9.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.814083010591276e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006293735932558775, + "sensitivity": 0.5236818998698629 + }, + { + "name": "model.layers.9.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9531441365834326e-05, + "sensitivity": 0.7657038237963819 + }, + { + "name": "model.layers.9.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.322194394670078e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006659358623437583, + "sensitivity": 0.5706050703236533 + }, + { + "name": "model.layers.9.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.887925362912938e-05, + "sensitivity": 0.6436733083256816 + }, + { + "name": "model.layers.9.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.167985020510969e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006619318737648427, + "sensitivity": 0.5290108594967304 + }, + { + "name": "model.layers.9.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000656602845992893, + "sensitivity": 0.514097078460974 + }, + { + "name": "model.layers.9.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.080371122152428e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006620692438445985, + "sensitivity": 0.568789201208717 + }, + { + "name": "model.layers.9.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006903898320160806, + "sensitivity": 0.5320747061318578 + }, + { + "name": "model.layers.9.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.109157766331919e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000696411938406527, + "sensitivity": 0.5325078106600659 + }, + { + "name": "model.layers.9.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006191586144268513, + "sensitivity": 0.5337677012401997 + }, + { + "name": "model.layers.9.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.873704367331811e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006208175327628851, + "sensitivity": 0.5340733676269468 + }, + { + "name": "model.layers.9.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.85506422794424e-05, + "sensitivity": 1.194714820506499 + }, + { + "name": "model.layers.9.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.117923021520255e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9208097809460014e-05, + "sensitivity": 0.8647505672822122 + }, + { + "name": "model.layers.9.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006238574278540909, + "sensitivity": 0.5909321231899699 + }, + { + "name": "model.layers.9.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.871881967323134e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006281984969973564, + "sensitivity": 0.5243314329131529 + }, + { + "name": "model.layers.9.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006588418036699295, + "sensitivity": 0.5324520713097508 + }, + { + "name": "model.layers.9.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.034725856807199e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006730224704369903, + "sensitivity": 0.5007686089559134 + }, + { + "name": "model.layers.9.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006276955245994031, + "sensitivity": 0.5845460142024931 + }, + { + "name": "model.layers.9.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.710224399990693e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006280700908973813, + "sensitivity": 0.5702853254599627 + }, + { + "name": "model.layers.9.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000672514084726572, + "sensitivity": 0.5749996773039407 + }, + { + "name": "model.layers.9.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.177214686431398e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000683644087985158, + "sensitivity": 0.5450299781845642 + }, + { + "name": "model.layers.9.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.681595575879328e-05, + "sensitivity": 0.698562847652964 + }, + { + "name": "model.layers.9.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.900087671761867e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006465903716161847, + "sensitivity": 0.5772235276835196 + }, + { + "name": "model.layers.9.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006058806902728975, + "sensitivity": 0.5493285933578267 + }, + { + "name": "model.layers.9.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.173936526465695e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006226762197911739, + "sensitivity": 0.5387091224318223 + }, + { + "name": "model.layers.9.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 6.44470537736197e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.7904869764606701e-06, + "sensitivity": 2.098691765052987 + }, + { + "name": "model.layers.9.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4080691244089394e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.9.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.2826337751903338e-06, + "sensitivity": 2.1041024894049896 + }, + { + "name": "model.layers.9.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 8.414354851993266e-06, + "sensitivity": 2.160577951362663 + }, + { + "name": "model.layers.9.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.0002055278018815443, + "sensitivity": 0.9758394399955677 + }, + { + "name": "model.layers.9.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.1490264114399906e-05, + "sensitivity": 1.440454501502106 + }, + { + "name": "model.layers.9.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.602277087746188e-05, + "sensitivity": 1.0306058150496469 + }, + { + "name": "model.layers.9.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002935559896286577, + "sensitivity": 0.6522346903047324 + }, + { + "name": "model.layers.10.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.778962804470211e-05, + "sensitivity": 0.9808496231820867 + }, + { + "name": "model.layers.10.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.064718718334916e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006752474000677466, + "sensitivity": 0.5051718119779935 + }, + { + "name": "model.layers.10.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7534467487130314e-05, + "sensitivity": 0.9782319225309131 + }, + { + "name": "model.layers.10.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.307191367544874e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006685412372462451, + "sensitivity": 0.5393400298205797 + }, + { + "name": "model.layers.10.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.00432395003736e-05, + "sensitivity": 0.8452413977093409 + }, + { + "name": "model.layers.10.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.237079333004658e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007047789986245334, + "sensitivity": 0.5540104723202642 + }, + { + "name": "model.layers.10.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.144259532447904e-05, + "sensitivity": 0.7316004233927859 + }, + { + "name": "model.layers.10.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.603675046790158e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.32608644082211e-05, + "sensitivity": 0.6762973472588387 + }, + { + "name": "model.layers.10.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0532969099585898e-05, + "sensitivity": 1.505433341184062 + }, + { + "name": "model.layers.10.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.540019169027801e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8956076827598736e-05, + "sensitivity": 0.6448369905623841 + }, + { + "name": "model.layers.10.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.128969107521698e-05, + "sensitivity": 0.7594544275436393 + }, + { + "name": "model.layers.10.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.232529585759039e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007039706688374281, + "sensitivity": 0.5435394746504489 + }, + { + "name": "model.layers.10.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0184374888194725e-05, + "sensitivity": 0.8801975015220301 + }, + { + "name": "model.layers.10.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.127438609837554e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006880480796098709, + "sensitivity": 0.5259072770482316 + }, + { + "name": "model.layers.10.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006616414757445455, + "sensitivity": 0.5897524633967041 + }, + { + "name": "model.layers.10.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.301182793322369e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006962766638025641, + "sensitivity": 0.5461120303176393 + }, + { + "name": "model.layers.10.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.526706809177995e-05, + "sensitivity": 0.8790529909840765 + }, + { + "name": "model.layers.10.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.079139893699903e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006438078125938773, + "sensitivity": 0.5320622667209733 + }, + { + "name": "model.layers.10.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006738455849699676, + "sensitivity": 0.5930142970596674 + }, + { + "name": "model.layers.10.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.359173312375788e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007061576470732689, + "sensitivity": 0.5269607773495272 + }, + { + "name": "model.layers.10.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.776726902695373e-05, + "sensitivity": 1.1065529440385444 + }, + { + "name": "model.layers.10.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.896816901440616e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006651724688708782, + "sensitivity": 0.5327759889330748 + }, + { + "name": "model.layers.10.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.547194086830132e-05, + "sensitivity": 1.0924891877453267 + }, + { + "name": "model.layers.10.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.962087357147539e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8915960835292935e-05, + "sensitivity": 0.7262918333389989 + }, + { + "name": "model.layers.10.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4679723689332604e-05, + "sensitivity": 0.6602954846173905 + }, + { + "name": "model.layers.10.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.463331831379037e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006260558729991317, + "sensitivity": 0.5238481079451808 + }, + { + "name": "model.layers.10.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.650188076193444e-06, + "sensitivity": 1.6087106127945627 + }, + { + "name": "model.layers.10.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.706790489057312e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.335133755579591e-05, + "sensitivity": 0.8387386607626195 + }, + { + "name": "model.layers.10.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006929850205779076, + "sensitivity": 0.5436607478452298 + }, + { + "name": "model.layers.10.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.223152126949572e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007114153122529387, + "sensitivity": 0.5116419740107498 + }, + { + "name": "model.layers.10.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.842001337441616e-05, + "sensitivity": 0.7878559624336845 + }, + { + "name": "model.layers.10.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.935887088526215e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006724897539243102, + "sensitivity": 0.5328886575378998 + }, + { + "name": "model.layers.10.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.928682367084548e-05, + "sensitivity": 0.6881578893620952 + }, + { + "name": "model.layers.10.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.441488835662312e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007042217766866088, + "sensitivity": 0.5158498920603503 + }, + { + "name": "model.layers.10.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006556875305250287, + "sensitivity": 0.5920130227006183 + }, + { + "name": "model.layers.10.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.266907917051867e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006873593665659428, + "sensitivity": 0.5453190553901024 + }, + { + "name": "model.layers.10.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.944468648522161e-05, + "sensitivity": 0.7058197019870776 + }, + { + "name": "model.layers.10.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.172757593958522e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006910410593263805, + "sensitivity": 0.5080285266049768 + }, + { + "name": "model.layers.10.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.84337748377584e-06, + "sensitivity": 1.2389759961560076 + }, + { + "name": "model.layers.10.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.779098728453391e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006188277620822191, + "sensitivity": 0.5065140885537013 + }, + { + "name": "model.layers.10.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.701010741177015e-05, + "sensitivity": 0.9420418282648158 + }, + { + "name": "model.layers.10.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.981967206025729e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006688495050184429, + "sensitivity": 0.5252855386414306 + }, + { + "name": "model.layers.10.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.243365351110697e-05, + "sensitivity": 0.6244959770091504 + }, + { + "name": "model.layers.10.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.499245728264214e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007275642128661275, + "sensitivity": 0.530632388011969 + }, + { + "name": "model.layers.10.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.533221337827854e-05, + "sensitivity": 1.1751690669302712 + }, + { + "name": "model.layers.10.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.763337185271666e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006303695845417678, + "sensitivity": 0.5563235283281187 + }, + { + "name": "model.layers.10.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.940699338680133e-05, + "sensitivity": 0.6944992359452228 + }, + { + "name": "model.layers.10.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.463130262090999e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000705813872627914, + "sensitivity": 0.5336359173587198 + }, + { + "name": "model.layers.10.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1231291864532977e-05, + "sensitivity": 1.554162935144629 + }, + { + "name": "model.layers.10.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.213085725903511e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.047237548045814e-05, + "sensitivity": 0.8435829573102192 + }, + { + "name": "model.layers.10.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7614772231318057e-05, + "sensitivity": 1.087269912938866 + }, + { + "name": "model.layers.10.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.116522399679525e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006687987479381263, + "sensitivity": 0.57025976039468 + }, + { + "name": "model.layers.10.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.615534610114992e-05, + "sensitivity": 0.9512175329683256 + }, + { + "name": "model.layers.10.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.822868160976213e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006573497084900737, + "sensitivity": 0.5171680850125782 + }, + { + "name": "model.layers.10.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7809764257399365e-05, + "sensitivity": 0.8638499247696438 + }, + { + "name": "model.layers.10.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.2734079619986e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006624504458159208, + "sensitivity": 0.5434690939074788 + }, + { + "name": "model.layers.10.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.772476288257167e-05, + "sensitivity": 0.6827774957342929 + }, + { + "name": "model.layers.10.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.885822247364558e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000660410150885582, + "sensitivity": 0.5293121346377567 + }, + { + "name": "model.layers.10.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.087654527509585e-05, + "sensitivity": 1.3635356580995002 + }, + { + "name": "model.layers.10.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.922481361471e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000719210715033114, + "sensitivity": 0.5751011870033935 + }, + { + "name": "model.layers.10.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0184727216255851e-05, + "sensitivity": 1.2260693064775512 + }, + { + "name": "model.layers.10.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.573172868229449e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006366258021444082, + "sensitivity": 0.5115146495675152 + }, + { + "name": "model.layers.10.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006698633078485727, + "sensitivity": 0.5768079236272605 + }, + { + "name": "model.layers.10.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.309544460236793e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007010637782514095, + "sensitivity": 0.5276046151208734 + }, + { + "name": "model.layers.10.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4739241022616625e-05, + "sensitivity": 0.9731364141758012 + }, + { + "name": "model.layers.10.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.71595933251956e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006378927500918508, + "sensitivity": 0.5398747472891191 + }, + { + "name": "model.layers.10.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.134021532488987e-05, + "sensitivity": 0.8709408077345695 + }, + { + "name": "model.layers.10.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.511760375360609e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.34274329058826e-05, + "sensitivity": 0.71882371589081 + }, + { + "name": "model.layers.10.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.006375406286679e-05, + "sensitivity": 0.6771858240138329 + }, + { + "name": "model.layers.10.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.31224509106687e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006935363635420799, + "sensitivity": 0.5604030110397549 + }, + { + "name": "model.layers.10.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.742789289797656e-05, + "sensitivity": 1.0052689513331678 + }, + { + "name": "model.layers.10.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.866429546586005e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000650921487249434, + "sensitivity": 0.522069850279115 + }, + { + "name": "model.layers.10.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.552671427722089e-05, + "sensitivity": 1.158538280144923 + }, + { + "name": "model.layers.10.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.039290951775911e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.762848741142079e-05, + "sensitivity": 0.9010368646277446 + }, + { + "name": "model.layers.10.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0471079804119654e-05, + "sensitivity": 1.9210646470851043 + }, + { + "name": "model.layers.10.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.425506171581219e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006750381435267627, + "sensitivity": 0.5341414053330147 + }, + { + "name": "model.layers.10.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006994003779254854, + "sensitivity": 0.5686492270933112 + }, + { + "name": "model.layers.10.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.64010599393805e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000718334224075079, + "sensitivity": 0.5367061697071026 + }, + { + "name": "model.layers.10.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.887453880859539e-05, + "sensitivity": 0.8362507605393498 + }, + { + "name": "model.layers.10.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.303559985099128e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006775199435651302, + "sensitivity": 0.5485535195886381 + }, + { + "name": "model.layers.10.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.144210055936128e-05, + "sensitivity": 0.6682585427460439 + }, + { + "name": "model.layers.10.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.125196136963496e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006938920123502612, + "sensitivity": 0.5206058271769154 + }, + { + "name": "model.layers.10.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9981677622999996e-05, + "sensitivity": 0.6431723086640958 + }, + { + "name": "model.layers.10.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.057729251551791e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006922089378349483, + "sensitivity": 0.5582496069687256 + }, + { + "name": "model.layers.10.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6281387514900416e-05, + "sensitivity": 0.8003988698776401 + }, + { + "name": "model.layers.10.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.327399546535162e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006650573341175914, + "sensitivity": 0.5429115518341779 + }, + { + "name": "model.layers.10.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7886805734597147e-05, + "sensitivity": 0.7538841314440521 + }, + { + "name": "model.layers.10.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.039653044354054e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006681226077489555, + "sensitivity": 0.5520602870390326 + }, + { + "name": "model.layers.10.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1628125321294647e-05, + "sensitivity": 1.5218407304683867 + }, + { + "name": "model.layers.10.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.658849542873213e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007303711026906967, + "sensitivity": 0.53915012451045 + }, + { + "name": "model.layers.10.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8796485973289236e-05, + "sensitivity": 1.1188212545506375 + }, + { + "name": "model.layers.10.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.890545367037703e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006701587699353695, + "sensitivity": 0.5614258398081984 + }, + { + "name": "model.layers.10.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0783942899433896e-05, + "sensitivity": 1.1386557250299758 + }, + { + "name": "model.layers.10.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.191226020746399e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.22677180217579e-05, + "sensitivity": 0.8639922171816867 + }, + { + "name": "model.layers.10.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0107580793555826e-05, + "sensitivity": 0.6279555591419329 + }, + { + "name": "model.layers.10.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.181865614962589e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006940255407243967, + "sensitivity": 0.5260646146077993 + }, + { + "name": "model.layers.10.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.915312794968486e-05, + "sensitivity": 0.6100909152600885 + }, + { + "name": "model.layers.10.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.114302095738822e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006946211215108633, + "sensitivity": 0.5148680858091058 + }, + { + "name": "model.layers.10.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.64923211641144e-05, + "sensitivity": 0.7473449466492628 + }, + { + "name": "model.layers.10.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.795059792035318e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006573262508027256, + "sensitivity": 0.5162583412914175 + }, + { + "name": "model.layers.10.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.698015957023017e-05, + "sensitivity": 0.9999476831875491 + }, + { + "name": "model.layers.10.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.712337838303938e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006531418184749782, + "sensitivity": 0.5387711896575971 + }, + { + "name": "model.layers.10.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9089372371090576e-05, + "sensitivity": 0.7833055748671565 + }, + { + "name": "model.layers.10.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.964518206586945e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007000688347034156, + "sensitivity": 0.5196541942562746 + }, + { + "name": "model.layers.10.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.14955642959103e-05, + "sensitivity": 0.6710319048868427 + }, + { + "name": "model.layers.10.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.191843908709416e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007032208959572017, + "sensitivity": 0.5080426789267921 + }, + { + "name": "model.layers.10.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0548700275830925e-05, + "sensitivity": 0.8251030837695996 + }, + { + "name": "model.layers.10.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.472560016845819e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007117760251276195, + "sensitivity": 0.5133899109601321 + }, + { + "name": "model.layers.10.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.771568976342678e-05, + "sensitivity": 0.758481966186873 + }, + { + "name": "model.layers.10.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.779335197075852e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006465050973929465, + "sensitivity": 0.5183906604730939 + }, + { + "name": "model.layers.10.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007342511671595275, + "sensitivity": 0.5209691324399041 + }, + { + "name": "model.layers.10.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.674192150057934e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007591458852402866, + "sensitivity": 0.5190607569985405 + }, + { + "name": "model.layers.10.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.461570617626421e-05, + "sensitivity": 0.8783931479536159 + }, + { + "name": "model.layers.10.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.73069769416179e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006302502006292343, + "sensitivity": 0.5215380516650012 + }, + { + "name": "model.layers.10.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.777849582955241e-05, + "sensitivity": 1.0238632714599207 + }, + { + "name": "model.layers.10.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.784729637525743e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006464679609052837, + "sensitivity": 0.5561990382867451 + }, + { + "name": "model.layers.10.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.380992661230266e-05, + "sensitivity": 0.8100174360649663 + }, + { + "name": "model.layers.10.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.691909450433741e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006254971376620233, + "sensitivity": 0.539287262156092 + }, + { + "name": "model.layers.10.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.144361395854503e-05, + "sensitivity": 1.1200247679100033 + }, + { + "name": "model.layers.10.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.507192438220955e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007031867280602455, + "sensitivity": 0.5315708949210067 + }, + { + "name": "model.layers.10.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.967274046270177e-05, + "sensitivity": 0.746719720362562 + }, + { + "name": "model.layers.10.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.204717237778823e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00069528998574242, + "sensitivity": 0.56651622729987 + }, + { + "name": "model.layers.10.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.141478661447763e-05, + "sensitivity": 0.8648946498828997 + }, + { + "name": "model.layers.10.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.280773732214584e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007168831652961671, + "sensitivity": 0.5201995862694142 + }, + { + "name": "model.layers.10.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.281946843955666e-05, + "sensitivity": 0.6798635587957006 + }, + { + "name": "model.layers.10.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.243961590575054e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007604529964737594, + "sensitivity": 0.5866853242128609 + }, + { + "name": "model.layers.10.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.060205851099454e-05, + "sensitivity": 0.6125099777906133 + }, + { + "name": "model.layers.10.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.221889066182484e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007032882422208786, + "sensitivity": 0.5248706246353323 + }, + { + "name": "model.layers.10.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 6.57720556773711e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.9092685761279427e-06, + "sensitivity": 2.0988195862676102 + }, + { + "name": "model.layers.10.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.782430995779578e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.10.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.2594293821166502e-06, + "sensitivity": 2.1033093244414762 + }, + { + "name": "model.layers.10.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 2.1491863662959076e-05, + "sensitivity": 1.7644165736283748 + }, + { + "name": "model.layers.10.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00017753778956830502, + "sensitivity": 0.9936385060102264 + }, + { + "name": "model.layers.10.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 5, + "mse": 3.0599258025176823e-06, + "sensitivity": 2.10302519579803 + }, + { + "name": "model.layers.10.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0004934285534545779, + "sensitivity": 0.5894430113653066 + }, + { + "name": "model.layers.10.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00029263197211548686, + "sensitivity": 0.902501797067964 + }, + { + "name": "model.layers.11.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0361402574926615e-05, + "sensitivity": 0.6023706760633327 + }, + { + "name": "model.layers.11.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.172108442115132e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007052895962260664, + "sensitivity": 0.5280479543794034 + }, + { + "name": "model.layers.11.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.796973709948361e-05, + "sensitivity": 0.8081416404807281 + }, + { + "name": "model.layers.11.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.234729426068952e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006920655723661184, + "sensitivity": 0.5008211818358708 + }, + { + "name": "model.layers.11.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.50604127056431e-05, + "sensitivity": 0.6825722054111821 + }, + { + "name": "model.layers.11.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.276766271184897e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.470716132549569e-05, + "sensitivity": 0.7387491204557114 + }, + { + "name": "model.layers.11.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8363650168757886e-05, + "sensitivity": 0.7906022137508409 + }, + { + "name": "model.layers.11.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.287403948590509e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000694180082064122, + "sensitivity": 0.5173936149719223 + }, + { + "name": "model.layers.11.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.77527898713015e-05, + "sensitivity": 1.0504680668502608 + }, + { + "name": "model.layers.11.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.632783424720401e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8749705203808844e-05, + "sensitivity": 1.1350975070586211 + }, + { + "name": "model.layers.11.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.228358688531443e-05, + "sensitivity": 0.618975170927762 + }, + { + "name": "model.layers.11.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.916468464623904e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007170757162384689, + "sensitivity": 0.5264530139960808 + }, + { + "name": "model.layers.11.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006860606372356415, + "sensitivity": 0.5438726011741133 + }, + { + "name": "model.layers.11.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.266598688853264e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007181983673945069, + "sensitivity": 0.5324002202044814 + }, + { + "name": "model.layers.11.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.403661483185715e-06, + "sensitivity": 2.097466040063141 + }, + { + "name": "model.layers.11.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.823446933092782e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.427839980460703e-05, + "sensitivity": 0.6278238452756947 + }, + { + "name": "model.layers.11.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.762535147368908e-05, + "sensitivity": 0.650545012628262 + }, + { + "name": "model.layers.11.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.37450284557417e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006798223475925624, + "sensitivity": 0.5165541623544111 + }, + { + "name": "model.layers.11.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006627188413403928, + "sensitivity": 0.5904622879878545 + }, + { + "name": "model.layers.11.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.955495794296439e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006831339560449123, + "sensitivity": 0.5784976605018954 + }, + { + "name": "model.layers.11.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006859493441879749, + "sensitivity": 0.5017361679737629 + }, + { + "name": "model.layers.11.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.405493877537083e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007233502110466361, + "sensitivity": 0.55555555551672 + }, + { + "name": "model.layers.11.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.644105112878606e-05, + "sensitivity": 0.8787458854404175 + }, + { + "name": "model.layers.11.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.439665180048905e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.937464811722748e-05, + "sensitivity": 0.7762796699869896 + }, + { + "name": "model.layers.11.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.886988219572231e-05, + "sensitivity": 0.8668026831853006 + }, + { + "name": "model.layers.11.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.19658749201335e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006812134524807334, + "sensitivity": 0.5486142293116909 + }, + { + "name": "model.layers.11.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.662973126163706e-05, + "sensitivity": 0.9019174061084743 + }, + { + "name": "model.layers.11.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.953352797405387e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006472700042650104, + "sensitivity": 0.5643055778385534 + }, + { + "name": "model.layers.11.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7433393521932885e-05, + "sensitivity": 0.9361358457705721 + }, + { + "name": "model.layers.11.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.095330829542945e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006540577742271125, + "sensitivity": 0.5438391747410771 + }, + { + "name": "model.layers.11.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006754290661774576, + "sensitivity": 0.5286697780077116 + }, + { + "name": "model.layers.11.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.571437438651628e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007088728016242385, + "sensitivity": 0.5463444711450689 + }, + { + "name": "model.layers.11.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0202095836575609e-05, + "sensitivity": 1.4232004278743426 + }, + { + "name": "model.layers.11.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.725365437887376e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.886871804250404e-05, + "sensitivity": 0.6875892995738143 + }, + { + "name": "model.layers.11.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006926845526322722, + "sensitivity": 0.5800302195806806 + }, + { + "name": "model.layers.11.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.839285333626322e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.422249134629965e-05, + "sensitivity": 0.6418741316797166 + }, + { + "name": "model.layers.11.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006565148942172527, + "sensitivity": 0.5599577061611214 + }, + { + "name": "model.layers.11.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.270253720686014e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006770341424271464, + "sensitivity": 0.5527231137950138 + }, + { + "name": "model.layers.11.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.935416993452236e-05, + "sensitivity": 1.022477491420641 + }, + { + "name": "model.layers.11.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.224217372619023e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006962606566958129, + "sensitivity": 0.5119732962936744 + }, + { + "name": "model.layers.11.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.591745866695419e-05, + "sensitivity": 0.6805142027780415 + }, + { + "name": "model.layers.11.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.949731303189765e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006670517614111304, + "sensitivity": 0.5395684475642144 + }, + { + "name": "model.layers.11.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.790618888568133e-05, + "sensitivity": 0.6380648442996587 + }, + { + "name": "model.layers.11.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.040619950908876e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006646787514910102, + "sensitivity": 0.5860625029012416 + }, + { + "name": "model.layers.11.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007038038456812501, + "sensitivity": 0.5551057678722349 + }, + { + "name": "model.layers.11.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.126035370674799e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.692273746011779e-05, + "sensitivity": 0.7558305776427597 + }, + { + "name": "model.layers.11.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.390015576267615e-05, + "sensitivity": 1.1362201423727611 + }, + { + "name": "model.layers.11.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.538638561120024e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006249562720768154, + "sensitivity": 0.5694440592479623 + }, + { + "name": "model.layers.11.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006947522051632404, + "sensitivity": 0.5144441311715582 + }, + { + "name": "model.layers.11.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.696482159895822e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007362505421042442, + "sensitivity": 0.5251897303512247 + }, + { + "name": "model.layers.11.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006693325703963637, + "sensitivity": 0.5108378074312884 + }, + { + "name": "model.layers.11.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.607107252420974e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007056001340970397, + "sensitivity": 0.528142451101946 + }, + { + "name": "model.layers.11.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006922582979314029, + "sensitivity": 0.579023753489149 + }, + { + "name": "model.layers.11.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.596705475203635e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.536625733133405e-05, + "sensitivity": 0.6089873681505772 + }, + { + "name": "model.layers.11.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.17992045590654e-05, + "sensitivity": 0.7957411506249544 + }, + { + "name": "model.layers.11.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.373907126544509e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007114330073818564, + "sensitivity": 0.5401249016879698 + }, + { + "name": "model.layers.11.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.080843048839597e-05, + "sensitivity": 1.425282703934228 + }, + { + "name": "model.layers.11.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.957941423024749e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.979530396871269e-05, + "sensitivity": 0.6012036054417664 + }, + { + "name": "model.layers.11.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.944816439296119e-05, + "sensitivity": 0.8203063577633689 + }, + { + "name": "model.layers.11.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.228935944818659e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006860228604637086, + "sensitivity": 0.5827092079854196 + }, + { + "name": "model.layers.11.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.596108894678764e-05, + "sensitivity": 0.6798547915571933 + }, + { + "name": "model.layers.11.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.9319359024812e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.64186557312496e-05, + "sensitivity": 0.8254945364652033 + }, + { + "name": "model.layers.11.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.091125396778807e-05, + "sensitivity": 0.6321540252624798 + }, + { + "name": "model.layers.11.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.220875548024196e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007153353653848171, + "sensitivity": 0.5433718656990403 + }, + { + "name": "model.layers.11.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.748809780925512e-05, + "sensitivity": 0.6948426392057012 + }, + { + "name": "model.layers.11.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.984868494124385e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.049437070032582e-05, + "sensitivity": 0.6192686923464186 + }, + { + "name": "model.layers.11.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006850312929600477, + "sensitivity": 0.5633331029419104 + }, + { + "name": "model.layers.11.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.414306881197263e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000725744990631938, + "sensitivity": 0.5369430009841447 + }, + { + "name": "model.layers.11.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006689398433081806, + "sensitivity": 0.5337652418166731 + }, + { + "name": "model.layers.11.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.300426207417331e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006982035702094436, + "sensitivity": 0.5570071063205955 + }, + { + "name": "model.layers.11.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.682997188065201e-06, + "sensitivity": 1.8274658013207374 + }, + { + "name": "model.layers.11.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.3816705758436e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005963838775642216, + "sensitivity": 0.549014354845991 + }, + { + "name": "model.layers.11.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.693256025551818e-05, + "sensitivity": 0.6572753450867674 + }, + { + "name": "model.layers.11.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.95229380451201e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006504305056296289, + "sensitivity": 0.5209342719672923 + }, + { + "name": "model.layers.11.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006721990648657084, + "sensitivity": 0.5245708008429625 + }, + { + "name": "model.layers.11.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.28543091352185e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007129220175556839, + "sensitivity": 0.5021148290848686 + }, + { + "name": "model.layers.11.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006717243231832981, + "sensitivity": 0.540784433525504 + }, + { + "name": "model.layers.11.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.134287673376093e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006887810304760933, + "sensitivity": 0.4994425966188444 + }, + { + "name": "model.layers.11.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000666693493258208, + "sensitivity": 0.5450596204860867 + }, + { + "name": "model.layers.11.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.160976226965431e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006850412464700639, + "sensitivity": 0.5384600800959418 + }, + { + "name": "model.layers.11.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.468774806009606e-06, + "sensitivity": 1.9034568831917276 + }, + { + "name": "model.layers.11.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.509797347258427e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.04466297570616e-05, + "sensitivity": 0.7891271073961957 + }, + { + "name": "model.layers.11.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.70408564171521e-06, + "sensitivity": 1.9133009934411283 + }, + { + "name": "model.layers.11.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.583925144492241e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.559333294513635e-05, + "sensitivity": 0.697246217815531 + }, + { + "name": "model.layers.11.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.218800990609452e-05, + "sensitivity": 0.9512563526268878 + }, + { + "name": "model.layers.11.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.935513283679029e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007269473280757666, + "sensitivity": 0.5544312460110434 + }, + { + "name": "model.layers.11.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.866777428309433e-05, + "sensitivity": 0.6818237236290683 + }, + { + "name": "model.layers.11.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.44535703031579e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.051356831449084e-05, + "sensitivity": 0.8535566569019615 + }, + { + "name": "model.layers.11.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006603755755349994, + "sensitivity": 0.550940301614032 + }, + { + "name": "model.layers.11.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.143900463939644e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000676508410833776, + "sensitivity": 0.5489237568247056 + }, + { + "name": "model.layers.11.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.841855899139773e-06, + "sensitivity": 1.2971400353428502 + }, + { + "name": "model.layers.11.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.618725253953016e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000631738337688148, + "sensitivity": 0.5554754834953265 + }, + { + "name": "model.layers.11.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006738192751072347, + "sensitivity": 0.5895826383135829 + }, + { + "name": "model.layers.11.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.205902423062071e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006933609838597476, + "sensitivity": 0.5189650738235299 + }, + { + "name": "model.layers.11.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.880012031411752e-05, + "sensitivity": 0.709440769729506 + }, + { + "name": "model.layers.11.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.112150003900751e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006759336101822555, + "sensitivity": 0.5492671763455518 + }, + { + "name": "model.layers.11.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.119678437244147e-05, + "sensitivity": 0.9698874659095851 + }, + { + "name": "model.layers.11.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.392330078597297e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007246757159009576, + "sensitivity": 0.5291056580223185 + }, + { + "name": "model.layers.11.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.839896039105952e-05, + "sensitivity": 0.9793326648294476 + }, + { + "name": "model.layers.11.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.638394438596151e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006820972776040435, + "sensitivity": 0.5195699758374454 + }, + { + "name": "model.layers.11.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.910825711907819e-05, + "sensitivity": 0.8155130115022294 + }, + { + "name": "model.layers.11.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.276574708863336e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006781625561416149, + "sensitivity": 0.5942577881963579 + }, + { + "name": "model.layers.11.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0248892067465931e-05, + "sensitivity": 1.274213226435846 + }, + { + "name": "model.layers.11.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.370079859152611e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7557568652555346e-05, + "sensitivity": 0.7857790677345432 + }, + { + "name": "model.layers.11.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006621081265620887, + "sensitivity": 0.5653875140227614 + }, + { + "name": "model.layers.11.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.160271368571557e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006808030302636325, + "sensitivity": 0.5245687024719512 + }, + { + "name": "model.layers.11.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.034388206899166e-05, + "sensitivity": 0.7865951118755241 + }, + { + "name": "model.layers.11.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.59787929180311e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007238417165353894, + "sensitivity": 0.531128523773392 + }, + { + "name": "model.layers.11.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000656680203974247, + "sensitivity": 0.5545149699665356 + }, + { + "name": "model.layers.11.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.142943220766028e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006878200802020729, + "sensitivity": 0.5517254511661365 + }, + { + "name": "model.layers.11.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.977490218356252e-05, + "sensitivity": 0.7728735486051791 + }, + { + "name": "model.layers.11.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.262003691721475e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.068415677873418e-05, + "sensitivity": 0.7359972130515529 + }, + { + "name": "model.layers.11.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7529086916474625e-05, + "sensitivity": 0.6541230428945418 + }, + { + "name": "model.layers.11.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.247022383831791e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006725979037582874, + "sensitivity": 0.545783899722834 + }, + { + "name": "model.layers.11.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006666940171271563, + "sensitivity": 0.5393477791381771 + }, + { + "name": "model.layers.11.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.956017048447393e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006787478923797607, + "sensitivity": 0.5193965770765014 + }, + { + "name": "model.layers.11.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007116055930964649, + "sensitivity": 0.5163983060021724 + }, + { + "name": "model.layers.11.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.512381673928758e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007416519219987094, + "sensitivity": 0.5178389475122684 + }, + { + "name": "model.layers.11.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8444922615308315e-05, + "sensitivity": 0.8261181781636844 + }, + { + "name": "model.layers.11.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.295658749877475e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000682335696183145, + "sensitivity": 0.5223030956951871 + }, + { + "name": "model.layers.11.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6408505770377815e-05, + "sensitivity": 0.6628780297005148 + }, + { + "name": "model.layers.11.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.781495815426752e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.803595558973029e-05, + "sensitivity": 0.6451308050004336 + }, + { + "name": "model.layers.11.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.899274765397422e-05, + "sensitivity": 0.6830752360480908 + }, + { + "name": "model.layers.11.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.223424406925915e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006920045125298202, + "sensitivity": 0.5066886713573628 + }, + { + "name": "model.layers.11.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0709998605307192e-05, + "sensitivity": 1.2760941291913044 + }, + { + "name": "model.layers.11.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.252533353290346e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.027795825502835e-05, + "sensitivity": 0.8235260172182701 + }, + { + "name": "model.layers.11.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006741394754499197, + "sensitivity": 0.5278701970270008 + }, + { + "name": "model.layers.11.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.105874490458518e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.221261719474569e-05, + "sensitivity": 0.6992084989593526 + }, + { + "name": "model.layers.11.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 6.385485448845429e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.8400713770461152e-06, + "sensitivity": 2.099326973997355 + }, + { + "name": "model.layers.11.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.102072360481543e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.11.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.3309794439919642e-06, + "sensitivity": 2.104988802766868 + }, + { + "name": "model.layers.11.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 6.134292107162764e-06, + "sensitivity": 2.1752904397754556 + }, + { + "name": "model.layers.11.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.0001630842889426276, + "sensitivity": 0.91040535852251 + }, + { + "name": "model.layers.11.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.0399892744317185e-05, + "sensitivity": 1.1543488108497717 + }, + { + "name": "model.layers.11.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 4.889959382126108e-05, + "sensitivity": 1.1891302646168425 + }, + { + "name": "model.layers.11.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002651199174579233, + "sensitivity": 0.7803161949184054 + }, + { + "name": "model.layers.12.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.636231799144298e-05, + "sensitivity": 0.759941182257984 + }, + { + "name": "model.layers.12.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.427370635719853e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8909979998134077e-05, + "sensitivity": 1.1783281600549604 + }, + { + "name": "model.layers.12.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.885998689336702e-05, + "sensitivity": 0.6052555123571318 + }, + { + "name": "model.layers.12.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.312442337730317e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.163920625112951e-05, + "sensitivity": 0.8114663749770405 + }, + { + "name": "model.layers.12.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.16736215306446e-05, + "sensitivity": 0.6785402879889288 + }, + { + "name": "model.layers.12.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.606627150380518e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.306769500952214e-05, + "sensitivity": 0.6194891774456395 + }, + { + "name": "model.layers.12.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000690278597176075, + "sensitivity": 0.524743339363307 + }, + { + "name": "model.layers.12.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.420559657271951e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000710082589648664, + "sensitivity": 0.5384992863421173 + }, + { + "name": "model.layers.12.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.317780935205519e-05, + "sensitivity": 0.6219981239749898 + }, + { + "name": "model.layers.12.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.580711442438769e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007336337002925575, + "sensitivity": 0.5758093757841802 + }, + { + "name": "model.layers.12.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006245928816497326, + "sensitivity": 0.5988081480886636 + }, + { + "name": "model.layers.12.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.523567097043269e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.4885458666831255e-05, + "sensitivity": 0.9914702905728707 + }, + { + "name": "model.layers.12.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.595500624622218e-05, + "sensitivity": 0.9312701325656729 + }, + { + "name": "model.layers.12.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.838442120875698e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006642492371611297, + "sensitivity": 0.5192191854100985 + }, + { + "name": "model.layers.12.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006637185579165816, + "sensitivity": 0.5257544706036732 + }, + { + "name": "model.layers.12.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.047702072464745e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006839375710114837, + "sensitivity": 0.5166358711770291 + }, + { + "name": "model.layers.12.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.008095806464553e-05, + "sensitivity": 0.6824242869315277 + }, + { + "name": "model.layers.12.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.122874083303032e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006983274943195283, + "sensitivity": 0.5483046700953289 + }, + { + "name": "model.layers.12.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007211598567664623, + "sensitivity": 0.5625624691591881 + }, + { + "name": "model.layers.12.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.72952126024029e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007581400568597019, + "sensitivity": 0.5145075777179439 + }, + { + "name": "model.layers.12.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007176985964179039, + "sensitivity": 0.5463312023465541 + }, + { + "name": "model.layers.12.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.602411986023071e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007460913620889187, + "sensitivity": 0.5287646178753407 + }, + { + "name": "model.layers.12.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.719728869735263e-05, + "sensitivity": 0.8605215666175463 + }, + { + "name": "model.layers.12.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.104115411493694e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006626652320846915, + "sensitivity": 0.5723892507682504 + }, + { + "name": "model.layers.12.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6729149946477264e-05, + "sensitivity": 0.7278545898064479 + }, + { + "name": "model.layers.12.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.902280690861517e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.847858119523153e-05, + "sensitivity": 0.6029579562844388 + }, + { + "name": "model.layers.12.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.616607813863084e-05, + "sensitivity": 0.9962050025239464 + }, + { + "name": "model.layers.12.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.272196060308488e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006395844975486398, + "sensitivity": 0.5959007710118852 + }, + { + "name": "model.layers.12.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.193454464664683e-05, + "sensitivity": 0.8596183987038384 + }, + { + "name": "model.layers.12.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.583025762869511e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.407278124243021e-05, + "sensitivity": 0.645775327782902 + }, + { + "name": "model.layers.12.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006151042180135846, + "sensitivity": 0.5715881071228238 + }, + { + "name": "model.layers.12.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.563301783695351e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.576456896960735e-05, + "sensitivity": 0.8741769960792249 + }, + { + "name": "model.layers.12.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006883294554427266, + "sensitivity": 0.5524746770111341 + }, + { + "name": "model.layers.12.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.218586463546671e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007106189150363207, + "sensitivity": 0.5664784169409872 + }, + { + "name": "model.layers.12.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.069099981687032e-05, + "sensitivity": 0.9454817582355571 + }, + { + "name": "model.layers.12.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.739806164863694e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.317460065474734e-05, + "sensitivity": 0.6607912575645426 + }, + { + "name": "model.layers.12.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007170591270551085, + "sensitivity": 0.5345769820749555 + }, + { + "name": "model.layers.12.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.787880693082116e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007515839533880353, + "sensitivity": 0.5697470816425864 + }, + { + "name": "model.layers.12.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007043037912808359, + "sensitivity": 0.5539295752609752 + }, + { + "name": "model.layers.12.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.859660857116978e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007318216376006603, + "sensitivity": 0.5338595850081986 + }, + { + "name": "model.layers.12.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006845784373581409, + "sensitivity": 0.5854048880502086 + }, + { + "name": "model.layers.12.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.328408517219941e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007082149386405945, + "sensitivity": 0.5176717430356143 + }, + { + "name": "model.layers.12.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006512944819405675, + "sensitivity": 0.5503723284355205 + }, + { + "name": "model.layers.12.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.419925284717465e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006700567901134491, + "sensitivity": 0.5211531160382458 + }, + { + "name": "model.layers.12.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006482729222625494, + "sensitivity": 0.5839189274362098 + }, + { + "name": "model.layers.12.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.799781206405896e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006592727149836719, + "sensitivity": 0.5063560594215736 + }, + { + "name": "model.layers.12.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006684426916763186, + "sensitivity": 0.5336485336249982 + }, + { + "name": "model.layers.12.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.239761205506511e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007109094294719398, + "sensitivity": 0.5174259363924817 + }, + { + "name": "model.layers.12.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006635827012360096, + "sensitivity": 0.5965074823943557 + }, + { + "name": "model.layers.12.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.283787001848395e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006861781002953649, + "sensitivity": 0.5493419119169018 + }, + { + "name": "model.layers.12.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006719328230246902, + "sensitivity": 0.5252050474422184 + }, + { + "name": "model.layers.12.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.083722610128461e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006848800694569945, + "sensitivity": 0.5463853861343517 + }, + { + "name": "model.layers.12.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.940850678598508e-05, + "sensitivity": 0.9959811344470813 + }, + { + "name": "model.layers.12.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.503490794784739e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.1132693543913774e-05, + "sensitivity": 1.2817616791606552 + }, + { + "name": "model.layers.12.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0623464378295466e-05, + "sensitivity": 0.7066081171975909 + }, + { + "name": "model.layers.12.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.67514541419223e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006964506465010345, + "sensitivity": 0.5027131402154881 + }, + { + "name": "model.layers.12.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0283608036115766e-05, + "sensitivity": 0.616603805971583 + }, + { + "name": "model.layers.12.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.302692554527312e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006913223769515753, + "sensitivity": 0.505025460798008 + }, + { + "name": "model.layers.12.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006944821216166019, + "sensitivity": 0.5823518498880056 + }, + { + "name": "model.layers.12.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.885998118377756e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007446687086485326, + "sensitivity": 0.5688143900828186 + }, + { + "name": "model.layers.12.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.674914427800104e-05, + "sensitivity": 0.6660712865562357 + }, + { + "name": "model.layers.12.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.057632049305539e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006540852482430637, + "sensitivity": 0.5245099026296792 + }, + { + "name": "model.layers.12.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.238535570446402e-05, + "sensitivity": 0.6118556346523719 + }, + { + "name": "model.layers.12.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.60478121972119e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007288106717169285, + "sensitivity": 0.5159612870846828 + }, + { + "name": "model.layers.12.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007051985594443977, + "sensitivity": 0.5340425872571704 + }, + { + "name": "model.layers.12.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.466189006459899e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007267742766998708, + "sensitivity": 0.5248515166328314 + }, + { + "name": "model.layers.12.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.385624535847455e-05, + "sensitivity": 0.8736300063846498 + }, + { + "name": "model.layers.12.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.522975925487117e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006162581848911941, + "sensitivity": 0.5334058310255637 + }, + { + "name": "model.layers.12.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006579109467566013, + "sensitivity": 0.5773858269609038 + }, + { + "name": "model.layers.12.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.718190661558765e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006853702361695468, + "sensitivity": 0.5468656353303916 + }, + { + "name": "model.layers.12.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.161972851259634e-05, + "sensitivity": 0.6290586947402512 + }, + { + "name": "model.layers.12.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.564848149537283e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007047991966828704, + "sensitivity": 0.5785443512187254 + }, + { + "name": "model.layers.12.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.58749889023602e-05, + "sensitivity": 0.8212811502582554 + }, + { + "name": "model.layers.12.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.727212505415082e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8657162298914045e-05, + "sensitivity": 0.792732587607683 + }, + { + "name": "model.layers.12.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.304238922894001e-05, + "sensitivity": 0.7313718832234587 + }, + { + "name": "model.layers.12.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.779403065593215e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000730621803086251, + "sensitivity": 0.5567458527328897 + }, + { + "name": "model.layers.12.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7611610827734694e-05, + "sensitivity": 1.0870911758806787 + }, + { + "name": "model.layers.12.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.415647249014e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9877980675082654e-05, + "sensitivity": 0.9761021390666428 + }, + { + "name": "model.layers.12.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.00541643507313e-05, + "sensitivity": 0.7208335181804948 + }, + { + "name": "model.layers.12.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.413828259610455e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007322716410271823, + "sensitivity": 0.5298101616918476 + }, + { + "name": "model.layers.12.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.419850251404569e-05, + "sensitivity": 0.6073675110651314 + }, + { + "name": "model.layers.12.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.151706995500717e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007453008438460529, + "sensitivity": 0.5452027474865949 + }, + { + "name": "model.layers.12.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.186957762110978e-05, + "sensitivity": 0.7889542365813849 + }, + { + "name": "model.layers.12.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.502183964585129e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007367273792624474, + "sensitivity": 0.5953982299213705 + }, + { + "name": "model.layers.12.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.780162973678671e-05, + "sensitivity": 0.7734870348426193 + }, + { + "name": "model.layers.12.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.091003683650342e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006675328477285802, + "sensitivity": 0.5405408303012746 + }, + { + "name": "model.layers.12.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.146676605567336e-05, + "sensitivity": 0.7816314965604535 + }, + { + "name": "model.layers.12.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.444603855015885e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007009041728451848, + "sensitivity": 0.5102425379002148 + }, + { + "name": "model.layers.12.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.786094334325753e-05, + "sensitivity": 0.7669438416807197 + }, + { + "name": "model.layers.12.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.27041060852207e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006651963340118527, + "sensitivity": 0.5817342957048908 + }, + { + "name": "model.layers.12.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007323298486880958, + "sensitivity": 0.5166590418411565 + }, + { + "name": "model.layers.12.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.707585953336093e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007603932172060013, + "sensitivity": 0.5292782400807197 + }, + { + "name": "model.layers.12.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7907323935069144e-05, + "sensitivity": 1.004960405898511 + }, + { + "name": "model.layers.12.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.862941290819435e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006639162893407047, + "sensitivity": 0.548907375743311 + }, + { + "name": "model.layers.12.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006751944310963154, + "sensitivity": 0.5890137764023573 + }, + { + "name": "model.layers.12.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.239547474251594e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.22452498646453e-05, + "sensitivity": 0.6603000649427458 + }, + { + "name": "model.layers.12.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006585297523997724, + "sensitivity": 0.5311659798909181 + }, + { + "name": "model.layers.12.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.011956656948314e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006844803574495018, + "sensitivity": 0.5314891345534339 + }, + { + "name": "model.layers.12.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007072719745337963, + "sensitivity": 0.53490122451838 + }, + { + "name": "model.layers.12.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.691041107842466e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007390842656604946, + "sensitivity": 0.5241588671009685 + }, + { + "name": "model.layers.12.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.484713983605616e-05, + "sensitivity": 0.8511848218081453 + }, + { + "name": "model.layers.12.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.514946792573028e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006099209422245622, + "sensitivity": 0.561864462305743 + }, + { + "name": "model.layers.12.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.809974391013384e-05, + "sensitivity": 0.7752764838575913 + }, + { + "name": "model.layers.12.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.017108944433858e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.836947093484923e-05, + "sensitivity": 0.8518957944026155 + }, + { + "name": "model.layers.12.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000695945811457932, + "sensitivity": 0.5808690172160238 + }, + { + "name": "model.layers.12.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.415431812456518e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007319545256905258, + "sensitivity": 0.5106654008651896 + }, + { + "name": "model.layers.12.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006759455427527428, + "sensitivity": 0.5297197531006302 + }, + { + "name": "model.layers.12.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.26090752575692e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007022283971309662, + "sensitivity": 0.5227785144235431 + }, + { + "name": "model.layers.12.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0307262174319476e-05, + "sensitivity": 0.8761861824537265 + }, + { + "name": "model.layers.12.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.386932795976463e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006974959978833795, + "sensitivity": 0.5341785236819516 + }, + { + "name": "model.layers.12.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.196570757310838e-05, + "sensitivity": 0.6480543425900495 + }, + { + "name": "model.layers.12.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.556338121299632e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007126411655917764, + "sensitivity": 0.5170662940090835 + }, + { + "name": "model.layers.12.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0801064490806311e-05, + "sensitivity": 1.856151173347638 + }, + { + "name": "model.layers.12.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.284759592745104e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006966108921915293, + "sensitivity": 0.5420684024716232 + }, + { + "name": "model.layers.12.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.263422255869955e-05, + "sensitivity": 0.7115034837371867 + }, + { + "name": "model.layers.12.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.878997282910859e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007527022971771657, + "sensitivity": 0.5329304014663769 + }, + { + "name": "model.layers.12.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9890324337175116e-05, + "sensitivity": 0.6643975490737969 + }, + { + "name": "model.layers.12.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.158810492706834e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006951118703000247, + "sensitivity": 0.5748505417588756 + }, + { + "name": "model.layers.12.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000683491351082921, + "sensitivity": 0.554210340379596 + }, + { + "name": "model.layers.12.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.245331292120682e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007000734331086278, + "sensitivity": 0.5481569993152704 + }, + { + "name": "model.layers.12.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.06515932304319e-05, + "sensitivity": 0.6110218055036527 + }, + { + "name": "model.layers.12.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.449399734265171e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006991593400016427, + "sensitivity": 0.5239039827362704 + }, + { + "name": "model.layers.12.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0656690392352175e-05, + "sensitivity": 1.281168874430988 + }, + { + "name": "model.layers.12.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.129753723551403e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.814119867864065e-05, + "sensitivity": 0.8146663146216453 + }, + { + "name": "model.layers.12.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0369155461376067e-05, + "sensitivity": 1.4073382385969764 + }, + { + "name": "model.layers.12.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.251212880670209e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006831069476902485, + "sensitivity": 0.5749013438627224 + }, + { + "name": "model.layers.12.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8865563914878294e-05, + "sensitivity": 1.06878296463252 + }, + { + "name": "model.layers.12.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.393595413101139e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007081844378262758, + "sensitivity": 0.5352382692357747 + }, + { + "name": "model.layers.12.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 7.578591066703666e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.992287479879451e-06, + "sensitivity": 2.0987521082387626 + }, + { + "name": "model.layers.12.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.026938189686916e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.12.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 6.208537342899945e-06, + "sensitivity": 1.8711669473939367 + }, + { + "name": "model.layers.12.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 2.2511312636197545e-05, + "sensitivity": 1.9150231379964497 + }, + { + "name": "model.layers.12.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.0001565248385304585, + "sensitivity": 1.0476692840587734 + }, + { + "name": "model.layers.12.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.235627587448107e-05, + "sensitivity": 1.934892637538176 + }, + { + "name": "model.layers.12.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0005378288915380836, + "sensitivity": 0.5895019700751076 + }, + { + "name": "model.layers.12.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00027789006708189845, + "sensitivity": 0.807532544710627 + }, + { + "name": "model.layers.13.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006705971900373697, + "sensitivity": 0.5418482597497432 + }, + { + "name": "model.layers.13.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.104689873609459e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000683736230712384, + "sensitivity": 0.5322144039325415 + }, + { + "name": "model.layers.13.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8918300055665895e-05, + "sensitivity": 0.7330366477697594 + }, + { + "name": "model.layers.13.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.298735115706222e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006687843124382198, + "sensitivity": 0.5161391331175633 + }, + { + "name": "model.layers.13.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0258132533635944e-05, + "sensitivity": 1.2529397344145543 + }, + { + "name": "model.layers.13.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.859164957655594e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000638830941170454, + "sensitivity": 0.5099671450630836 + }, + { + "name": "model.layers.13.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.969023550278507e-05, + "sensitivity": 0.9028159954690793 + }, + { + "name": "model.layers.13.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.478475711446663e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007094345055520535, + "sensitivity": 0.5768295944073324 + }, + { + "name": "model.layers.13.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007315609836950898, + "sensitivity": 0.5593875736758074 + }, + { + "name": "model.layers.13.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.61428828152566e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007571796304546297, + "sensitivity": 0.5149253875718489 + }, + { + "name": "model.layers.13.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006658544298261404, + "sensitivity": 0.5359408541017547 + }, + { + "name": "model.layers.13.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.266459990911244e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006931519019417465, + "sensitivity": 0.5371587892424631 + }, + { + "name": "model.layers.13.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.828064604429528e-05, + "sensitivity": 0.7821515051272174 + }, + { + "name": "model.layers.13.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.320101988421811e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006783092394471169, + "sensitivity": 0.5268608277509137 + }, + { + "name": "model.layers.13.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.405344902304932e-05, + "sensitivity": 0.6630617834159483 + }, + { + "name": "model.layers.13.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.282798151209136e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007611599285155535, + "sensitivity": 0.5363047656552119 + }, + { + "name": "model.layers.13.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007043571094982326, + "sensitivity": 0.5170317024911938 + }, + { + "name": "model.layers.13.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.710947673127521e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007497264887206256, + "sensitivity": 0.5401092460648746 + }, + { + "name": "model.layers.13.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.044582859321963e-05, + "sensitivity": 1.5634469974958918 + }, + { + "name": "model.layers.13.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.233140652511793e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.022433444741182e-05, + "sensitivity": 0.6452758818108215 + }, + { + "name": "model.layers.13.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0057850886369124e-05, + "sensitivity": 1.2393276483625564 + }, + { + "name": "model.layers.13.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.76686306380725e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006576689193025231, + "sensitivity": 0.5234686715334745 + }, + { + "name": "model.layers.13.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.202467920957133e-05, + "sensitivity": 0.7241771981638798 + }, + { + "name": "model.layers.13.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1245350606259308e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007177807274274528, + "sensitivity": 0.5274597427284188 + }, + { + "name": "model.layers.13.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6647892051842064e-05, + "sensitivity": 0.8248015733301655 + }, + { + "name": "model.layers.13.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.402883852591913e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.717950261896476e-05, + "sensitivity": 0.6403121828619804 + }, + { + "name": "model.layers.13.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007011740235611796, + "sensitivity": 0.5590657571429916 + }, + { + "name": "model.layers.13.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.408408808056265e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007200231775641441, + "sensitivity": 0.5367367028080665 + }, + { + "name": "model.layers.13.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.98106998950243e-05, + "sensitivity": 0.7439584363405798 + }, + { + "name": "model.layers.13.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.688398457299627e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007016637828201056, + "sensitivity": 0.5089717111989815 + }, + { + "name": "model.layers.13.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.420414865715429e-05, + "sensitivity": 0.6600545217049201 + }, + { + "name": "model.layers.13.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.475464371964335e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007460989872924984, + "sensitivity": 0.5729863193301702 + }, + { + "name": "model.layers.13.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.857076757820323e-05, + "sensitivity": 1.161018904821625 + }, + { + "name": "model.layers.13.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.665043307904853e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.133363058324903e-05, + "sensitivity": 0.75392578187197 + }, + { + "name": "model.layers.13.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007242028368636966, + "sensitivity": 0.5340912451292371 + }, + { + "name": "model.layers.13.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.593145371880382e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007510663708671927, + "sensitivity": 0.556822898814817 + }, + { + "name": "model.layers.13.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006651420844718814, + "sensitivity": 0.537471803954744 + }, + { + "name": "model.layers.13.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.493305590993259e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006838254630565643, + "sensitivity": 0.5046802066622342 + }, + { + "name": "model.layers.13.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.852907634107396e-05, + "sensitivity": 0.6019217572938944 + }, + { + "name": "model.layers.13.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.288511258389917e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007051086286082864, + "sensitivity": 0.5610005585605815 + }, + { + "name": "model.layers.13.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9965805121464655e-05, + "sensitivity": 0.803433359058456 + }, + { + "name": "model.layers.13.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.426313348129042e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007107971468940377, + "sensitivity": 0.5124178423144684 + }, + { + "name": "model.layers.13.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.299755477812141e-05, + "sensitivity": 0.7270705984012271 + }, + { + "name": "model.layers.13.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.566921797457326e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007494239835068583, + "sensitivity": 0.5402497718071926 + }, + { + "name": "model.layers.13.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.822919411002658e-05, + "sensitivity": 0.6355970953416358 + }, + { + "name": "model.layers.13.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.276121666815015e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.054139157640748e-05, + "sensitivity": 0.8598011770048394 + }, + { + "name": "model.layers.13.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007017932366579771, + "sensitivity": 0.5439270217786126 + }, + { + "name": "model.layers.13.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.641583922828431e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000721562304534018, + "sensitivity": 0.5559405541089271 + }, + { + "name": "model.layers.13.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.438120908569545e-05, + "sensitivity": 0.8176482380656251 + }, + { + "name": "model.layers.13.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.880265805695672e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.434034730773419e-05, + "sensitivity": 0.634363924776348 + }, + { + "name": "model.layers.13.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006877341656945646, + "sensitivity": 0.5916884303959782 + }, + { + "name": "model.layers.13.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.652644515270367e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007265376625582576, + "sensitivity": 0.5367827979677593 + }, + { + "name": "model.layers.13.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000657983124256134, + "sensitivity": 0.5460789233439325 + }, + { + "name": "model.layers.13.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.925389245931001e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006730548338964581, + "sensitivity": 0.506115395223929 + }, + { + "name": "model.layers.13.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007061773794703186, + "sensitivity": 0.5564259195725404 + }, + { + "name": "model.layers.13.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.850825684523443e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007307949708774686, + "sensitivity": 0.5425764461643929 + }, + { + "name": "model.layers.13.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1806369002442807e-05, + "sensitivity": 1.2588698300122558 + }, + { + "name": "model.layers.13.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.826149044376507e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.956540164537728e-05, + "sensitivity": 0.6597936191563625 + }, + { + "name": "model.layers.13.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000702214427292347, + "sensitivity": 0.5583391136751825 + }, + { + "name": "model.layers.13.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.766457545381854e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007205373840406537, + "sensitivity": 0.5308899788893989 + }, + { + "name": "model.layers.13.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006596962921321392, + "sensitivity": 0.5708021702944801 + }, + { + "name": "model.layers.13.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.959066129435087e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.942365896771662e-05, + "sensitivity": 0.610312809173613 + }, + { + "name": "model.layers.13.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006809655460529029, + "sensitivity": 0.5829784180406694 + }, + { + "name": "model.layers.13.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.538148227264173e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007335233385674655, + "sensitivity": 0.5414627804128236 + }, + { + "name": "model.layers.13.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9437337768031284e-05, + "sensitivity": 0.9473804963533099 + }, + { + "name": "model.layers.13.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.781747513035953e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.031511293258518e-05, + "sensitivity": 0.8157532096467046 + }, + { + "name": "model.layers.13.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007286419859156013, + "sensitivity": 0.55683918945083 + }, + { + "name": "model.layers.13.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.966896535232081e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007589161396026611, + "sensitivity": 0.547234537338825 + }, + { + "name": "model.layers.13.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.217305781319737e-05, + "sensitivity": 0.6466447375250708 + }, + { + "name": "model.layers.13.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.812196033934015e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007595595670863986, + "sensitivity": 0.5166545779943985 + }, + { + "name": "model.layers.13.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007004259969107807, + "sensitivity": 0.5257467957320046 + }, + { + "name": "model.layers.13.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.562853513969458e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007197301601991057, + "sensitivity": 0.537577327987681 + }, + { + "name": "model.layers.13.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006650143186561763, + "sensitivity": 0.5064377206493583 + }, + { + "name": "model.layers.13.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.008747277519433e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006847957847639918, + "sensitivity": 0.5345804911308001 + }, + { + "name": "model.layers.13.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.024158210493624e-05, + "sensitivity": 0.6819080305607849 + }, + { + "name": "model.layers.13.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.324264631984988e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006958772428333759, + "sensitivity": 0.5503256189531173 + }, + { + "name": "model.layers.13.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.181489152368158e-05, + "sensitivity": 0.6775718163632408 + }, + { + "name": "model.layers.13.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.206751545003499e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.401163409464061e-05, + "sensitivity": 0.6667229417017793 + }, + { + "name": "model.layers.13.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000679697550367564, + "sensitivity": 0.5342462993443657 + }, + { + "name": "model.layers.13.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.535166789944924e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007408942328765988, + "sensitivity": 0.5462068178342693 + }, + { + "name": "model.layers.13.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.790631257696077e-05, + "sensitivity": 1.0133839198565133 + }, + { + "name": "model.layers.13.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3056281886747456e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.034310717950575e-05, + "sensitivity": 1.0299393227124674 + }, + { + "name": "model.layers.13.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000705104204826057, + "sensitivity": 0.5440496919465222 + }, + { + "name": "model.layers.13.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.808463695051614e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007264238665811718, + "sensitivity": 0.5118185704971003 + }, + { + "name": "model.layers.13.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.05301174800843e-05, + "sensitivity": 0.8396026136695491 + }, + { + "name": "model.layers.13.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.445295639423421e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006891838274896145, + "sensitivity": 0.5279721094025157 + }, + { + "name": "model.layers.13.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.228846905287355e-05, + "sensitivity": 0.9172532659546316 + }, + { + "name": "model.layers.13.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.713593165841303e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007203062996268272, + "sensitivity": 0.5557897836704917 + }, + { + "name": "model.layers.13.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.298576772678643e-05, + "sensitivity": 0.710141172354313 + }, + { + "name": "model.layers.13.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.525521030198433e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007246903842315078, + "sensitivity": 0.5176168997223963 + }, + { + "name": "model.layers.13.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.527234654640779e-05, + "sensitivity": 0.6134318375746868 + }, + { + "name": "model.layers.13.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.258151981659466e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007720102439634502, + "sensitivity": 0.5889224034714904 + }, + { + "name": "model.layers.13.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7006236602319404e-05, + "sensitivity": 0.8686722991269762 + }, + { + "name": "model.layers.13.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.012977564751054e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000646440195851028, + "sensitivity": 0.5456577317382206 + }, + { + "name": "model.layers.13.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006992561975494027, + "sensitivity": 0.5907440903667776 + }, + { + "name": "model.layers.13.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.626024742217851e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000746759760659188, + "sensitivity": 0.5347358460399324 + }, + { + "name": "model.layers.13.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.1390333131421357e-06, + "sensitivity": 2.097142131232253 + }, + { + "name": "model.layers.13.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.257828886191419e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006342150154523551, + "sensitivity": 0.5867642382041823 + }, + { + "name": "model.layers.13.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.397015386028215e-05, + "sensitivity": 0.8487237990698264 + }, + { + "name": "model.layers.13.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.588140533698606e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.674084579572082e-05, + "sensitivity": 0.6347324397784037 + }, + { + "name": "model.layers.13.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.297070649452507e-05, + "sensitivity": 0.6412547881785828 + }, + { + "name": "model.layers.13.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.56680981592217e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.577970634680241e-05, + "sensitivity": 0.7378154670210785 + }, + { + "name": "model.layers.13.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006760961259715259, + "sensitivity": 0.5964924607680248 + }, + { + "name": "model.layers.13.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.363969760059263e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006821169517934322, + "sensitivity": 0.5617305142838773 + }, + { + "name": "model.layers.13.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.047442366252653e-05, + "sensitivity": 0.7186710208753743 + }, + { + "name": "model.layers.13.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.652358024439309e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006946390494704247, + "sensitivity": 0.5861683210423596 + }, + { + "name": "model.layers.13.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000663559592794627, + "sensitivity": 0.5114296921292939 + }, + { + "name": "model.layers.13.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.967132210571435e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006816376699134707, + "sensitivity": 0.5900383227126988 + }, + { + "name": "model.layers.13.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006749517051503062, + "sensitivity": 0.5549459888235914 + }, + { + "name": "model.layers.13.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.209310186022776e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007015386363491416, + "sensitivity": 0.5273847693322626 + }, + { + "name": "model.layers.13.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7939520047511905e-05, + "sensitivity": 0.6561468017299673 + }, + { + "name": "model.layers.13.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.098159133216541e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006763784913346171, + "sensitivity": 0.5317467416830755 + }, + { + "name": "model.layers.13.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.870843233424239e-05, + "sensitivity": 0.6232871830775193 + }, + { + "name": "model.layers.13.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.80344214742945e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006642249645665288, + "sensitivity": 0.5748447298135455 + }, + { + "name": "model.layers.13.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006707921857014298, + "sensitivity": 0.5798794080686547 + }, + { + "name": "model.layers.13.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.265552201512037e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007067783735692501, + "sensitivity": 0.5043957414094913 + }, + { + "name": "model.layers.13.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006925404886715114, + "sensitivity": 0.5412814125525611 + }, + { + "name": "model.layers.13.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.361624400597066e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007243709405884147, + "sensitivity": 0.5788457366618766 + }, + { + "name": "model.layers.13.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.513237167382613e-05, + "sensitivity": 0.9362962450225583 + }, + { + "name": "model.layers.13.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.48554953133862e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007813346455805004, + "sensitivity": 0.531018691177048 + }, + { + "name": "model.layers.13.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006926512578502297, + "sensitivity": 0.5244504915199122 + }, + { + "name": "model.layers.13.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.271530992307817e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007068172562867403, + "sensitivity": 0.5665036049315471 + }, + { + "name": "model.layers.13.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000684476166497916, + "sensitivity": 0.5860145444792346 + }, + { + "name": "model.layers.13.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.396858225343749e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007099999347701669, + "sensitivity": 0.5096769626380164 + }, + { + "name": "model.layers.13.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.78506660531275e-05, + "sensitivity": 0.8498135862858365 + }, + { + "name": "model.layers.13.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.005404422168795e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.94886441831477e-05, + "sensitivity": 0.612439734281197 + }, + { + "name": "model.layers.13.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007072924636304379, + "sensitivity": 0.5432184665027648 + }, + { + "name": "model.layers.13.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.91239051775483e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007575529161840677, + "sensitivity": 0.5926635555288478 + }, + { + "name": "model.layers.13.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 7.023246325843502e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.9417202565819025e-06, + "sensitivity": 2.0990889568773845 + }, + { + "name": "model.layers.13.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.988203722357866e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.13.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.48803565025446e-06, + "sensitivity": 2.105817594416845 + }, + { + "name": "model.layers.13.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 5.592394700215664e-06, + "sensitivity": 2.1730539557518287 + }, + { + "name": "model.layers.13.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00016621100076008588, + "sensitivity": 1.0622823339169334 + }, + { + "name": "model.layers.13.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.2051654266542755e-05, + "sensitivity": 1.5805417042889367 + }, + { + "name": "model.layers.13.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.4553205700358376e-05, + "sensitivity": 0.7561287938176162 + }, + { + "name": "model.layers.13.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00027277428307570517, + "sensitivity": 0.8600608511230464 + }, + { + "name": "model.layers.14.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9268990298733115e-05, + "sensitivity": 0.6322325016396934 + }, + { + "name": "model.layers.14.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.612514766857203e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.099935853853822e-05, + "sensitivity": 0.6065561518180216 + }, + { + "name": "model.layers.14.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.182621291372925e-05, + "sensitivity": 0.7905661764359047 + }, + { + "name": "model.layers.14.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.665406431238807e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006953291594982147, + "sensitivity": 0.5638319062949773 + }, + { + "name": "model.layers.14.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006711941678076982, + "sensitivity": 0.5258299497159836 + }, + { + "name": "model.layers.14.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.256394158299372e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007004779763519764, + "sensitivity": 0.5196989868154835 + }, + { + "name": "model.layers.14.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.136541196610779e-05, + "sensitivity": 0.7325720351847427 + }, + { + "name": "model.layers.14.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.419115834432887e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007138288347050548, + "sensitivity": 0.5232279602288801 + }, + { + "name": "model.layers.14.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0114781616721302e-05, + "sensitivity": 1.4089211817374212 + }, + { + "name": "model.layers.14.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.764561592513928e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006350773619487882, + "sensitivity": 0.548971630127804 + }, + { + "name": "model.layers.14.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.358754762914032e-05, + "sensitivity": 0.6707808366771462 + }, + { + "name": "model.layers.14.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.295035970855679e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.626039248658344e-05, + "sensitivity": 0.7282526931636053 + }, + { + "name": "model.layers.14.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.521831528516486e-05, + "sensitivity": 0.7615765748472758 + }, + { + "name": "model.layers.14.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.99384600011399e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007584767299704254, + "sensitivity": 0.5317295669804039 + }, + { + "name": "model.layers.14.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0202062185271643e-05, + "sensitivity": 1.4839098967390707 + }, + { + "name": "model.layers.14.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.659653877250094e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006286596180871129, + "sensitivity": 0.5130713167803612 + }, + { + "name": "model.layers.14.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.646835415973328e-05, + "sensitivity": 0.9761927693431046 + }, + { + "name": "model.layers.14.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.526640277115803e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000634396041277796, + "sensitivity": 0.5233997021729639 + }, + { + "name": "model.layers.14.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.841189340571873e-05, + "sensitivity": 0.7756194531827675 + }, + { + "name": "model.layers.14.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.164216301840497e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006668863352388144, + "sensitivity": 0.5696541462353261 + }, + { + "name": "model.layers.14.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9959151258226484e-05, + "sensitivity": 0.8673797323741852 + }, + { + "name": "model.layers.14.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.190503765741596e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006811079801991582, + "sensitivity": 0.555259330947314 + }, + { + "name": "model.layers.14.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.44987085252069e-05, + "sensitivity": 0.83294562661065 + }, + { + "name": "model.layers.14.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.034919005694974e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007518300553783774, + "sensitivity": 0.5832566696712773 + }, + { + "name": "model.layers.14.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0158889381273184e-05, + "sensitivity": 1.9870995959226678 + }, + { + "name": "model.layers.14.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4533732155541657e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.576657713390887e-05, + "sensitivity": 0.6897397724933797 + }, + { + "name": "model.layers.14.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.17035329923965e-05, + "sensitivity": 0.8119272346240194 + }, + { + "name": "model.layers.14.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.546405870722083e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.349570321617648e-05, + "sensitivity": 0.7276692070714615 + }, + { + "name": "model.layers.14.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.008361742715351e-05, + "sensitivity": 0.6571453659062083 + }, + { + "name": "model.layers.14.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.459359150947421e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000674002687446773, + "sensitivity": 0.5249109866804119 + }, + { + "name": "model.layers.14.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.815521581098437e-05, + "sensitivity": 0.7648110755693622 + }, + { + "name": "model.layers.14.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.845793111802777e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006603134097531438, + "sensitivity": 0.5496829632191528 + }, + { + "name": "model.layers.14.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0950413525279146e-05, + "sensitivity": 1.7174246659667134 + }, + { + "name": "model.layers.14.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.614212679778575e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00069773307768628, + "sensitivity": 0.5500594645690452 + }, + { + "name": "model.layers.14.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007036286406219006, + "sensitivity": 0.5546038689569099 + }, + { + "name": "model.layers.14.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.049206942610908e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007197256200015545, + "sensitivity": 0.5375633341152615 + }, + { + "name": "model.layers.14.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.03454936936032e-05, + "sensitivity": 0.8128724431042207 + }, + { + "name": "model.layers.14.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.427541165976436e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006928577786311507, + "sensitivity": 0.5402750014968624 + }, + { + "name": "model.layers.14.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0622289311140776e-05, + "sensitivity": 0.9521343935491201 + }, + { + "name": "model.layers.14.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.727292998220946e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007034544833004475, + "sensitivity": 0.524078366802857 + }, + { + "name": "model.layers.14.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.076219450624194e-05, + "sensitivity": 1.2096129914076144 + }, + { + "name": "model.layers.14.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.314782012850628e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000694778747856617, + "sensitivity": 0.5680851335421734 + }, + { + "name": "model.layers.14.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.165176455397159e-05, + "sensitivity": 0.6773202865689553 + }, + { + "name": "model.layers.14.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.102424888216774e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006895895348861814, + "sensitivity": 0.5435347648055046 + }, + { + "name": "model.layers.14.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.373008363880217e-05, + "sensitivity": 0.6552417846466466 + }, + { + "name": "model.layers.14.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.864644319648505e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007339939475059509, + "sensitivity": 0.5317276674689597 + }, + { + "name": "model.layers.14.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4876913054613397e-05, + "sensitivity": 0.6604132150762192 + }, + { + "name": "model.layers.14.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.782500807072211e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000646826985757798, + "sensitivity": 0.5133493342609248 + }, + { + "name": "model.layers.14.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006695803604088724, + "sensitivity": 0.5488528584017298 + }, + { + "name": "model.layers.14.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.217260306584649e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007011896814219654, + "sensitivity": 0.5237389776281608 + }, + { + "name": "model.layers.14.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.062864849809557e-05, + "sensitivity": 1.02116531938687 + }, + { + "name": "model.layers.14.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.544739221681084e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006979169556871057, + "sensitivity": 0.5273634391402818 + }, + { + "name": "model.layers.14.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1121813258796465e-05, + "sensitivity": 1.5328731130574724 + }, + { + "name": "model.layers.14.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.216898214006505e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006979742320254445, + "sensitivity": 0.5874986646061198 + }, + { + "name": "model.layers.14.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007048522820696235, + "sensitivity": 0.5783158397346168 + }, + { + "name": "model.layers.14.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.538946308864979e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007455623708665371, + "sensitivity": 0.5415162373220693 + }, + { + "name": "model.layers.14.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.026985283824615e-05, + "sensitivity": 0.6070173589338724 + }, + { + "name": "model.layers.14.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.694330636491941e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.111695984145626e-05, + "sensitivity": 0.634308091507239 + }, + { + "name": "model.layers.14.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.911339758313261e-05, + "sensitivity": 0.6973177695591772 + }, + { + "name": "model.layers.14.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.594434012185957e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006921462481841445, + "sensitivity": 0.5520639981231106 + }, + { + "name": "model.layers.14.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.929524195380509e-05, + "sensitivity": 0.6216219172089211 + }, + { + "name": "model.layers.14.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.540525419040932e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006809606566093862, + "sensitivity": 0.552576858458307 + }, + { + "name": "model.layers.14.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0014303370553534e-05, + "sensitivity": 1.5043533379375933 + }, + { + "name": "model.layers.14.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.854338951394311e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006361134583130479, + "sensitivity": 0.5331196971126233 + }, + { + "name": "model.layers.14.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.661091927322559e-05, + "sensitivity": 0.9414730058696977 + }, + { + "name": "model.layers.14.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.892927674722159e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006513199186883867, + "sensitivity": 0.5202020703876561 + }, + { + "name": "model.layers.14.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.358942482620478e-05, + "sensitivity": 0.7408772260482536 + }, + { + "name": "model.layers.14.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.926201194801251e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007590416353195906, + "sensitivity": 0.5652752001521282 + }, + { + "name": "model.layers.14.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.609877916867845e-05, + "sensitivity": 0.6794691728587788 + }, + { + "name": "model.layers.14.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.864686727363733e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000657767232041806, + "sensitivity": 0.5431134262719224 + }, + { + "name": "model.layers.14.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.664557102136314e-05, + "sensitivity": 0.6824614023494072 + }, + { + "name": "model.layers.14.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.928119316602533e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006928417133167386, + "sensitivity": 0.5689968615973146 + }, + { + "name": "model.layers.14.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.662355033564381e-05, + "sensitivity": 0.6749726561825502 + }, + { + "name": "model.layers.14.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.794695650569338e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006553381681442261, + "sensitivity": 0.5604486985064434 + }, + { + "name": "model.layers.14.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.154500442789868e-05, + "sensitivity": 0.8022074811195576 + }, + { + "name": "model.layers.14.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.735085662512574e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007084164535626769, + "sensitivity": 0.5669361892482073 + }, + { + "name": "model.layers.14.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.247959390748292e-05, + "sensitivity": 0.9025124350299286 + }, + { + "name": "model.layers.14.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.786871153963148e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007416463340632617, + "sensitivity": 0.5700681885147375 + }, + { + "name": "model.layers.14.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.620008960249834e-05, + "sensitivity": 1.062774370364688 + }, + { + "name": "model.layers.14.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.884919573873049e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006454241229221225, + "sensitivity": 0.5545993414816167 + }, + { + "name": "model.layers.14.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.287000021780841e-05, + "sensitivity": 1.0925294053766819 + }, + { + "name": "model.layers.14.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.673954319718177e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006292553152889013, + "sensitivity": 0.5603250454598456 + }, + { + "name": "model.layers.14.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.739732296206057e-05, + "sensitivity": 0.6738209023267594 + }, + { + "name": "model.layers.14.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.981619324302301e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006517893634736538, + "sensitivity": 0.5122537780678572 + }, + { + "name": "model.layers.14.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.948764010099694e-05, + "sensitivity": 0.9349434467936886 + }, + { + "name": "model.layers.14.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.127915526121797e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006851565558463335, + "sensitivity": 0.5357605579627281 + }, + { + "name": "model.layers.14.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006594301084987819, + "sensitivity": 0.5297145633349688 + }, + { + "name": "model.layers.14.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.126947482698597e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006962987827137113, + "sensitivity": 0.5434787173233784 + }, + { + "name": "model.layers.14.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.790558861917816e-05, + "sensitivity": 0.7977648314111919 + }, + { + "name": "model.layers.14.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.557503411386278e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.087414966605138e-05, + "sensitivity": 1.2035736063937292 + }, + { + "name": "model.layers.14.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.896287620998919e-05, + "sensitivity": 0.9557525957032791 + }, + { + "name": "model.layers.14.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.163539865156054e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.165869126562029e-05, + "sensitivity": 0.7768014718071815 + }, + { + "name": "model.layers.14.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6667991884751245e-05, + "sensitivity": 0.7791439410461196 + }, + { + "name": "model.layers.14.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.93195636611199e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006419676938094199, + "sensitivity": 0.5586400002791453 + }, + { + "name": "model.layers.14.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0632708482444286e-05, + "sensitivity": 0.9451040512434385 + }, + { + "name": "model.layers.14.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.179057550070866e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007082949741743505, + "sensitivity": 0.5642976662145509 + }, + { + "name": "model.layers.14.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.34800162515603e-05, + "sensitivity": 0.8535398964823151 + }, + { + "name": "model.layers.14.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.963929308767547e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007346257334575057, + "sensitivity": 0.5932081785876594 + }, + { + "name": "model.layers.14.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.92258402321022e-05, + "sensitivity": 0.8044227687170202 + }, + { + "name": "model.layers.14.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.314308507171518e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006685070693492889, + "sensitivity": 0.5519966258729392 + }, + { + "name": "model.layers.14.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.389514601323754e-05, + "sensitivity": 0.7717215594853437 + }, + { + "name": "model.layers.14.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.733729034953285e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007038887124508619, + "sensitivity": 0.5385640215636607 + }, + { + "name": "model.layers.14.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007099129725247622, + "sensitivity": 0.5127105997568068 + }, + { + "name": "model.layers.14.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.496597393379488e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000729805207811296, + "sensitivity": 0.5351931010254082 + }, + { + "name": "model.layers.14.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006477303104475141, + "sensitivity": 0.5673332553655167 + }, + { + "name": "model.layers.14.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.897617256778176e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006664302200078964, + "sensitivity": 0.5379584180981677 + }, + { + "name": "model.layers.14.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.409410707419738e-05, + "sensitivity": 1.0849564193191377 + }, + { + "name": "model.layers.14.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.692253009532578e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007320276345126331, + "sensitivity": 0.5629348729903022 + }, + { + "name": "model.layers.14.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.960026101092808e-05, + "sensitivity": 0.747871766428573 + }, + { + "name": "model.layers.14.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.359387043630704e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006975971045903862, + "sensitivity": 0.542365921274386 + }, + { + "name": "model.layers.14.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006844731396995485, + "sensitivity": 0.5964761064349269 + }, + { + "name": "model.layers.14.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.470443167927442e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.166138336993754e-05, + "sensitivity": 0.6067881755765269 + }, + { + "name": "model.layers.14.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.785465691587888e-05, + "sensitivity": 0.9866881957447801 + }, + { + "name": "model.layers.14.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.112950359238312e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006773656932637095, + "sensitivity": 0.5441838736242453 + }, + { + "name": "model.layers.14.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007127697463147342, + "sensitivity": 0.5642506327808916 + }, + { + "name": "model.layers.14.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.665838441222149e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.614334415644407e-05, + "sensitivity": 0.9147937003731529 + }, + { + "name": "model.layers.14.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.696304651792161e-05, + "sensitivity": 1.1440209274858266 + }, + { + "name": "model.layers.14.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.144169333310856e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006720131495967507, + "sensitivity": 0.5369806850950664 + }, + { + "name": "model.layers.14.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.904833597014658e-05, + "sensitivity": 0.9660844180499147 + }, + { + "name": "model.layers.14.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.331824238259287e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007056173635646701, + "sensitivity": 0.5369505475446392 + }, + { + "name": "model.layers.14.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.285589188337326e-05, + "sensitivity": 0.6103461003620749 + }, + { + "name": "model.layers.14.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.41807696158503e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007299637654796243, + "sensitivity": 0.5321541192596554 + }, + { + "name": "model.layers.14.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.835774936713278e-05, + "sensitivity": 1.0005837654300196 + }, + { + "name": "model.layers.14.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.325494723569136e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.119506724644452e-05, + "sensitivity": 0.6549636907652477 + }, + { + "name": "model.layers.14.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.878100637346506e-05, + "sensitivity": 0.6482106603955617 + }, + { + "name": "model.layers.14.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.057829864403175e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006944274064153433, + "sensitivity": 0.5356833592698961 + }, + { + "name": "model.layers.14.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.173417932586744e-05, + "sensitivity": 0.871210710111938 + }, + { + "name": "model.layers.14.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.188000381574966e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.371442577801645e-05, + "sensitivity": 0.6996696389132415 + }, + { + "name": "model.layers.14.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 6.352083346428117e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.110377863573376e-06, + "sensitivity": 2.0992645157304297 + }, + { + "name": "model.layers.14.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0223066055914387e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.14.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 6.370866231009131e-06, + "sensitivity": 1.3698959784549751 + }, + { + "name": "model.layers.14.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 2.392660826444626e-05, + "sensitivity": 1.4899908174045529 + }, + { + "name": "model.layers.14.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.0001749361545080319, + "sensitivity": 1.0545815329153554 + }, + { + "name": "model.layers.14.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.3910425877838861e-05, + "sensitivity": 1.5339453268740733 + }, + { + "name": "model.layers.14.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.4254192946245894e-05, + "sensitivity": 0.6604624794646152 + }, + { + "name": "model.layers.14.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00027901766588911414, + "sensitivity": 0.6704371725192947 + }, + { + "name": "model.layers.15.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.994607272441499e-05, + "sensitivity": 0.7222584130196478 + }, + { + "name": "model.layers.15.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.210191259015119e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006863586604595184, + "sensitivity": 0.518342683637294 + }, + { + "name": "model.layers.15.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.186324026202783e-05, + "sensitivity": 0.6702310736584287 + }, + { + "name": "model.layers.15.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.850928002677392e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007217337260954082, + "sensitivity": 0.5282199206508625 + }, + { + "name": "model.layers.15.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0510174433875363e-05, + "sensitivity": 1.2108000531645027 + }, + { + "name": "model.layers.15.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.485654691663512e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006415427196770906, + "sensitivity": 0.59872585789672 + }, + { + "name": "model.layers.15.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.135923467809334e-05, + "sensitivity": 0.6191004746580333 + }, + { + "name": "model.layers.15.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.86376438352454e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007037408649921417, + "sensitivity": 0.565493423806565 + }, + { + "name": "model.layers.15.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7445326092420146e-05, + "sensitivity": 1.0306020483751168 + }, + { + "name": "model.layers.15.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.620583690164494e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006733631598763168, + "sensitivity": 0.5365799198307969 + }, + { + "name": "model.layers.15.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.739625703427009e-05, + "sensitivity": 0.7714115888931953 + }, + { + "name": "model.layers.15.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.04732804276864e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000661818019580096, + "sensitivity": 0.5198987581125166 + }, + { + "name": "model.layers.15.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8745437854668126e-05, + "sensitivity": 0.6666344396106156 + }, + { + "name": "model.layers.15.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.114966820154223e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006629982381127775, + "sensitivity": 0.5073635727340801 + }, + { + "name": "model.layers.15.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000672802678309381, + "sensitivity": 0.5791580512962112 + }, + { + "name": "model.layers.15.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.527840241687954e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006804637378081679, + "sensitivity": 0.5488049421547193 + }, + { + "name": "model.layers.15.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9845457144547254e-05, + "sensitivity": 0.63695721345225 + }, + { + "name": "model.layers.15.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.729562755936058e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00068604142870754, + "sensitivity": 0.5443394920222941 + }, + { + "name": "model.layers.15.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8989440731238574e-05, + "sensitivity": 0.6978506966590899 + }, + { + "name": "model.layers.15.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.454281447076937e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006981170154176652, + "sensitivity": 0.5389050096924505 + }, + { + "name": "model.layers.15.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.747718023485504e-05, + "sensitivity": 0.786252079216689 + }, + { + "name": "model.layers.15.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.584000627502974e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006807716563344002, + "sensitivity": 0.5705604893601834 + }, + { + "name": "model.layers.15.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8597142924554646e-05, + "sensitivity": 0.8332342378279333 + }, + { + "name": "model.layers.15.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.591416763512825e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006561046466231346, + "sensitivity": 0.5961256026774857 + }, + { + "name": "model.layers.15.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0144193765881937e-05, + "sensitivity": 1.7203817598207916 + }, + { + "name": "model.layers.15.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.055945161482668e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000653531402349472, + "sensitivity": 0.5749766275734599 + }, + { + "name": "model.layers.15.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0666636272799224e-05, + "sensitivity": 0.7137081055869655 + }, + { + "name": "model.layers.15.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.643423944296956e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007101005176082253, + "sensitivity": 0.5385740128448679 + }, + { + "name": "model.layers.15.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.98198821535334e-05, + "sensitivity": 1.025194893273494 + }, + { + "name": "model.layers.15.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.188038810250873e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006951174582354724, + "sensitivity": 0.5292173069541033 + }, + { + "name": "model.layers.15.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.816874808166176e-06, + "sensitivity": 1.3075019287924385 + }, + { + "name": "model.layers.15.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.159547751849459e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006726091960445046, + "sensitivity": 0.5345230448306958 + }, + { + "name": "model.layers.15.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0520192518015392e-05, + "sensitivity": 1.2512583744645422 + }, + { + "name": "model.layers.15.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.449577085732017e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006421219441108406, + "sensitivity": 0.559220839342183 + }, + { + "name": "model.layers.15.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9351586969569325e-05, + "sensitivity": 0.9717988654598315 + }, + { + "name": "model.layers.15.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.250061801438278e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000680600933264941, + "sensitivity": 0.5159049905162431 + }, + { + "name": "model.layers.15.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0244619817240164e-05, + "sensitivity": 0.6952996618115642 + }, + { + "name": "model.layers.15.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.026630441941961e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007048847037367523, + "sensitivity": 0.5357826490622595 + }, + { + "name": "model.layers.15.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.183987716212869e-05, + "sensitivity": 0.6837694887297263 + }, + { + "name": "model.layers.15.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.487121027021203e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007006459636613727, + "sensitivity": 0.5345927794970369 + }, + { + "name": "model.layers.15.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0780198863358237e-05, + "sensitivity": 1.8155627927458127 + }, + { + "name": "model.layers.15.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.136965566838626e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006870089564472437, + "sensitivity": 0.5050264926049329 + }, + { + "name": "model.layers.15.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006763748824596405, + "sensitivity": 0.5270647197797189 + }, + { + "name": "model.layers.15.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.412203106265224e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006908592185936868, + "sensitivity": 0.5214844764533157 + }, + { + "name": "model.layers.15.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0896716958086472e-05, + "sensitivity": 1.4311009622013884 + }, + { + "name": "model.layers.15.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.667755994589243e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9597063227556646e-05, + "sensitivity": 0.6374442748788326 + }, + { + "name": "model.layers.15.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.868739026482217e-05, + "sensitivity": 0.7722726482422284 + }, + { + "name": "model.layers.15.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.395239324774593e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006808950565755367, + "sensitivity": 0.5757904912637354 + }, + { + "name": "model.layers.15.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6833185226423666e-05, + "sensitivity": 0.7538190644562284 + }, + { + "name": "model.layers.15.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.309298896667315e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006401796126738191, + "sensitivity": 0.5275963623757483 + }, + { + "name": "model.layers.15.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0073348676087335e-05, + "sensitivity": 1.7188261359347217 + }, + { + "name": "model.layers.15.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.33527804438927e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000663451268337667, + "sensitivity": 0.5678399960370867 + }, + { + "name": "model.layers.15.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006718876538798213, + "sensitivity": 0.5371554134519129 + }, + { + "name": "model.layers.15.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.483032848336734e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006889407522976398, + "sensitivity": 0.5527496592720551 + }, + { + "name": "model.layers.15.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0673548786144238e-05, + "sensitivity": 1.2875203068578505 + }, + { + "name": "model.layers.15.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.865850193411461e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7259032473666593e-05, + "sensitivity": 0.6666493278011713 + }, + { + "name": "model.layers.15.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006617532926611602, + "sensitivity": 0.5308410418079771 + }, + { + "name": "model.layers.15.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.961376470826508e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006734427297487855, + "sensitivity": 0.52839117975544 + }, + { + "name": "model.layers.15.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6158674851758406e-05, + "sensitivity": 1.0869032836146342 + }, + { + "name": "model.layers.15.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.632328108935326e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.667746518156491e-05, + "sensitivity": 0.6334351516311424 + }, + { + "name": "model.layers.15.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006979623576626182, + "sensitivity": 0.5950335926767372 + }, + { + "name": "model.layers.15.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.470006610470591e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007059215568006039, + "sensitivity": 0.5380353412458824 + }, + { + "name": "model.layers.15.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0474260307091754e-05, + "sensitivity": 1.488778685828328 + }, + { + "name": "model.layers.15.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.94450534410862e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006677600322291255, + "sensitivity": 0.5592764205978438 + }, + { + "name": "model.layers.15.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.966002936474979e-05, + "sensitivity": 0.719210013377719 + }, + { + "name": "model.layers.15.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.546755457748077e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007064248202368617, + "sensitivity": 0.5144651927973993 + }, + { + "name": "model.layers.15.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007394430576823652, + "sensitivity": 0.5873456447112639 + }, + { + "name": "model.layers.15.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.407742259601946e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007494264282286167, + "sensitivity": 0.5268109764475678 + }, + { + "name": "model.layers.15.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.671260805684142e-05, + "sensitivity": 0.8382725426594132 + }, + { + "name": "model.layers.15.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.226919365166395e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006523224292322993, + "sensitivity": 0.5063427715694083 + }, + { + "name": "model.layers.15.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.225942343007773e-05, + "sensitivity": 0.8937317281002206 + }, + { + "name": "model.layers.15.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.294214358604222e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007095427718013525, + "sensitivity": 0.5632144840016122 + }, + { + "name": "model.layers.15.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.29457863396965e-05, + "sensitivity": 0.6267379069456496 + }, + { + "name": "model.layers.15.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.732716428814456e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007197781233116984, + "sensitivity": 0.5218558477672534 + }, + { + "name": "model.layers.15.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.552562263095751e-05, + "sensitivity": 0.6168767905555625 + }, + { + "name": "model.layers.15.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.245574806802324e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007641931879334152, + "sensitivity": 0.5653564038807891 + }, + { + "name": "model.layers.15.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007112567545846105, + "sensitivity": 0.539255058865258 + }, + { + "name": "model.layers.15.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.823223657193012e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007275845855474472, + "sensitivity": 0.5039875679866103 + }, + { + "name": "model.layers.15.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.098483572714031e-05, + "sensitivity": 0.6875188267575335 + }, + { + "name": "model.layers.15.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.683962965325918e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007036597235128284, + "sensitivity": 0.5887076964266216 + }, + { + "name": "model.layers.15.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006289802258834243, + "sensitivity": 0.5617961074733278 + }, + { + "name": "model.layers.15.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.364828888967168e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006421259604394436, + "sensitivity": 0.5574332805594381 + }, + { + "name": "model.layers.15.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007081645308062434, + "sensitivity": 0.5533160957196352 + }, + { + "name": "model.layers.15.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.587309826500132e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007438319153152406, + "sensitivity": 0.539178313024078 + }, + { + "name": "model.layers.15.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006866293260827661, + "sensitivity": 0.5195799216321421 + }, + { + "name": "model.layers.15.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.770687832613476e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006985652144066989, + "sensitivity": 0.5522743220937621 + }, + { + "name": "model.layers.15.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.700884503312409e-05, + "sensitivity": 0.9246220210228486 + }, + { + "name": "model.layers.15.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.524982154587633e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006441748701035976, + "sensitivity": 0.5485950780941632 + }, + { + "name": "model.layers.15.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.634455010294914e-05, + "sensitivity": 1.0750183397882769 + }, + { + "name": "model.layers.15.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.878034698980628e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006670739385299385, + "sensitivity": 0.5276572932385426 + }, + { + "name": "model.layers.15.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.919231625739485e-05, + "sensitivity": 0.7827719011553838 + }, + { + "name": "model.layers.15.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.512183290396933e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006541367620229721, + "sensitivity": 0.5387953270855158 + }, + { + "name": "model.layers.15.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.147424574010074e-05, + "sensitivity": 0.8302693002861459 + }, + { + "name": "model.layers.15.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.08785137248924e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007045291131362319, + "sensitivity": 0.5367284826530241 + }, + { + "name": "model.layers.15.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6669668992981315e-05, + "sensitivity": 0.6926407968959543 + }, + { + "name": "model.layers.15.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.408863555407152e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006370587507262826, + "sensitivity": 0.5247276587992393 + }, + { + "name": "model.layers.15.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8764253481058404e-05, + "sensitivity": 0.8065787408252236 + }, + { + "name": "model.layers.15.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.026267556080711e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006722203688696027, + "sensitivity": 0.5203201471665125 + }, + { + "name": "model.layers.15.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.932779095019214e-05, + "sensitivity": 1.0668083518978788 + }, + { + "name": "model.layers.15.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.539365813296172e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007011410198174417, + "sensitivity": 0.5695020308030534 + }, + { + "name": "model.layers.15.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8839719713432714e-05, + "sensitivity": 0.7055598541044223 + }, + { + "name": "model.layers.15.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.34205321148329e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006674338364973664, + "sensitivity": 0.5631078052383575 + }, + { + "name": "model.layers.15.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9319725551176816e-05, + "sensitivity": 0.639544607400257 + }, + { + "name": "model.layers.15.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.43709142877924e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006768115563318133, + "sensitivity": 0.534157741924123 + }, + { + "name": "model.layers.15.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006892151432111859, + "sensitivity": 0.5942508892076761 + }, + { + "name": "model.layers.15.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.678495765299886e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007084048120304942, + "sensitivity": 0.5989733750231335 + }, + { + "name": "model.layers.15.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.110197864472866e-05, + "sensitivity": 0.6921747725382019 + }, + { + "name": "model.layers.15.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.737528105484671e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.469769141403958e-05, + "sensitivity": 0.602647106585502 + }, + { + "name": "model.layers.15.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.861670069862157e-05, + "sensitivity": 1.043134778401197 + }, + { + "name": "model.layers.15.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.943351079120475e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.025646143825725e-05, + "sensitivity": 0.6987595632930697 + }, + { + "name": "model.layers.15.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007297468837350607, + "sensitivity": 0.5233160240022272 + }, + { + "name": "model.layers.15.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.268998842846486e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007600678945891559, + "sensitivity": 0.5305339803931144 + }, + { + "name": "model.layers.15.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.288022268563509e-05, + "sensitivity": 0.8208959248151685 + }, + { + "name": "model.layers.15.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.275188522726239e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007533053867518902, + "sensitivity": 0.5982201714242442 + }, + { + "name": "model.layers.15.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.874945054529235e-05, + "sensitivity": 0.8431647132029618 + }, + { + "name": "model.layers.15.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.83655798638938e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006629276904277503, + "sensitivity": 0.5401363920314699 + }, + { + "name": "model.layers.15.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.249347643461078e-05, + "sensitivity": 0.8622206410447418 + }, + { + "name": "model.layers.15.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.814325388404541e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007317927083931863, + "sensitivity": 0.5590407574600169 + }, + { + "name": "model.layers.15.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.926871017436497e-05, + "sensitivity": 0.6689311863095654 + }, + { + "name": "model.layers.15.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.633374027842365e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006637400947511196, + "sensitivity": 0.5286108844087258 + }, + { + "name": "model.layers.15.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.174673762870952e-05, + "sensitivity": 0.6073003466206639 + }, + { + "name": "model.layers.15.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.652938964180066e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007275479729287326, + "sensitivity": 0.5544971107411215 + }, + { + "name": "model.layers.15.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006651929579675198, + "sensitivity": 0.5109869361719566 + }, + { + "name": "model.layers.15.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.557578444699175e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006787145393900573, + "sensitivity": 0.551704128326464 + }, + { + "name": "model.layers.15.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.017522117763292e-05, + "sensitivity": 1.3252179388578544 + }, + { + "name": "model.layers.15.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.189831651681743e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006417500553652644, + "sensitivity": 0.57655312726986 + }, + { + "name": "model.layers.15.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.915821748203598e-05, + "sensitivity": 0.809203465233935 + }, + { + "name": "model.layers.15.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.093369163158059e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006627162802033126, + "sensitivity": 0.537636664880039 + }, + { + "name": "model.layers.15.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 5.068502105132211e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.096842990795267e-06, + "sensitivity": 2.0993028904456734 + }, + { + "name": "model.layers.15.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.946851840439194e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.15.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.624228389118798e-06, + "sensitivity": 2.1060861603328584 + }, + { + "name": "model.layers.15.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 2.8612088499357924e-05, + "sensitivity": 1.3700640298838076 + }, + { + "name": "model.layers.15.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00018407079915050417, + "sensitivity": 0.9051123402210709 + }, + { + "name": "model.layers.15.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.3551402844313998e-05, + "sensitivity": 1.5183660563573949 + }, + { + "name": "model.layers.15.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.501047053257935e-05, + "sensitivity": 0.7320857509881563 + }, + { + "name": "model.layers.15.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 2, + "mse": 0.0032918842043727636, + "sensitivity": 0.584650092642997 + }, + { + "name": "model.layers.16.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.224007665878162e-05, + "sensitivity": 0.7622516027190953 + }, + { + "name": "model.layers.16.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.99677400461951e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007168391020968556, + "sensitivity": 0.5248118613157358 + }, + { + "name": "model.layers.16.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.051249637384899e-05, + "sensitivity": 1.8241192307702867 + }, + { + "name": "model.layers.16.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.164833052935137e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006576239829882979, + "sensitivity": 0.5377808014534956 + }, + { + "name": "model.layers.16.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.947776298853569e-05, + "sensitivity": 1.072660481692607 + }, + { + "name": "model.layers.16.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.032513510945137e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000680762343108654, + "sensitivity": 0.5396033806421399 + }, + { + "name": "model.layers.16.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.293645856203511e-05, + "sensitivity": 1.0082123755705465 + }, + { + "name": "model.layers.16.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.507331136162975e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.532444240292534e-05, + "sensitivity": 0.6340592480211182 + }, + { + "name": "model.layers.16.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7442863180767745e-05, + "sensitivity": 0.6334673248840488 + }, + { + "name": "model.layers.16.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.202473628036387e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006440478609874845, + "sensitivity": 0.5107838089027863 + }, + { + "name": "model.layers.16.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7089571782853454e-05, + "sensitivity": 1.0556867626329776 + }, + { + "name": "model.layers.16.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.137928494354128e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006477142451331019, + "sensitivity": 0.5330219545914051 + }, + { + "name": "model.layers.16.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0870207916013896e-05, + "sensitivity": 1.7621189401581063 + }, + { + "name": "model.layers.16.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.239447429834399e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.120756734162569e-05, + "sensitivity": 0.6737119427416391 + }, + { + "name": "model.layers.16.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0558631957974285e-05, + "sensitivity": 0.7939732005783025 + }, + { + "name": "model.layers.16.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.324566470539139e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006884997710585594, + "sensitivity": 0.5588543475228145 + }, + { + "name": "model.layers.16.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.381147250067443e-05, + "sensitivity": 0.6220324405777625 + }, + { + "name": "model.layers.16.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.922842885614955e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007228156318888068, + "sensitivity": 0.5518675114024028 + }, + { + "name": "model.layers.16.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9699486882891506e-05, + "sensitivity": 0.6727988508507179 + }, + { + "name": "model.layers.16.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.631183850913658e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006835697568021715, + "sensitivity": 0.5131521128650551 + }, + { + "name": "model.layers.16.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9316236729500815e-05, + "sensitivity": 0.7460597962414103 + }, + { + "name": "model.layers.16.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.25487189154228e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006735550705343485, + "sensitivity": 0.5416022796092522 + }, + { + "name": "model.layers.16.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1173951861565001e-05, + "sensitivity": 1.7284898131136477 + }, + { + "name": "model.layers.16.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.201310268101224e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006732711335644126, + "sensitivity": 0.5582300274660316 + }, + { + "name": "model.layers.16.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8580080803949386e-05, + "sensitivity": 0.6136015476678722 + }, + { + "name": "model.layers.16.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.314456868494744e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006676713819615543, + "sensitivity": 0.5699443393051762 + }, + { + "name": "model.layers.16.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0367940376454499e-05, + "sensitivity": 1.6039350455898633 + }, + { + "name": "model.layers.16.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.007592219248181e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006729345768690109, + "sensitivity": 0.5601310176753704 + }, + { + "name": "model.layers.16.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.173380825202912e-05, + "sensitivity": 0.858333705560047 + }, + { + "name": "model.layers.16.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.856692718632985e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006922126631252468, + "sensitivity": 0.5409565586988434 + }, + { + "name": "model.layers.16.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.026065238984302e-05, + "sensitivity": 1.1452213011450105 + }, + { + "name": "model.layers.16.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.940617135522189e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006945847999304533, + "sensitivity": 0.562063339507686 + }, + { + "name": "model.layers.16.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8704346884042025e-05, + "sensitivity": 0.923586780676567 + }, + { + "name": "model.layers.16.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.747977062739665e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006712715839967132, + "sensitivity": 0.5812517232280876 + }, + { + "name": "model.layers.16.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.755518941441551e-05, + "sensitivity": 0.8033317836243861 + }, + { + "name": "model.layers.16.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.553217986038362e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006370461778715253, + "sensitivity": 0.5558259148968988 + }, + { + "name": "model.layers.16.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.466080958489329e-05, + "sensitivity": 0.6056524111878661 + }, + { + "name": "model.layers.16.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.011951197455346e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007561428938060999, + "sensitivity": 0.5286861239144487 + }, + { + "name": "model.layers.16.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.020119326421991e-05, + "sensitivity": 0.820036150750267 + }, + { + "name": "model.layers.16.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.616886594201787e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006675976328551769, + "sensitivity": 0.5637410897346853 + }, + { + "name": "model.layers.16.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.606413469649851e-05, + "sensitivity": 1.0206227700385815 + }, + { + "name": "model.layers.16.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.257133691178751e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006100676255300641, + "sensitivity": 0.5533873770644027 + }, + { + "name": "model.layers.16.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.810125730931759e-05, + "sensitivity": 0.7463528146936594 + }, + { + "name": "model.layers.16.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.358858399835299e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006521352916024625, + "sensitivity": 0.5029004422347407 + }, + { + "name": "model.layers.16.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.744745067204349e-05, + "sensitivity": 0.9352001394445356 + }, + { + "name": "model.layers.16.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.2455649185722e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006613858859054744, + "sensitivity": 0.5298392671548894 + }, + { + "name": "model.layers.16.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0113650205312297e-05, + "sensitivity": 1.5449250102156142 + }, + { + "name": "model.layers.16.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.553285629706807e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006284556584432721, + "sensitivity": 0.5135888500017207 + }, + { + "name": "model.layers.16.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1078844181611203e-05, + "sensitivity": 1.3667565224461504 + }, + { + "name": "model.layers.16.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.398203140633996e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006851805374026299, + "sensitivity": 0.5227850398796935 + }, + { + "name": "model.layers.16.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.2076353616284905e-06, + "sensitivity": 2.0972363005800454 + }, + { + "name": "model.layers.16.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.479129979197751e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5939693993423134e-05, + "sensitivity": 0.6324605288097305 + }, + { + "name": "model.layers.16.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0669080438674428e-05, + "sensitivity": 1.3293120152573434 + }, + { + "name": "model.layers.16.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.307152489171131e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006704523111693561, + "sensitivity": 0.5361192619787151 + }, + { + "name": "model.layers.16.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8492543757893145e-05, + "sensitivity": 0.9211756706834802 + }, + { + "name": "model.layers.16.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.983250730423606e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006758067756891251, + "sensitivity": 0.5063142945484759 + }, + { + "name": "model.layers.16.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0047905561805237e-05, + "sensitivity": 1.5393984048174307 + }, + { + "name": "model.layers.16.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.586315516367904e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.541136488318443e-05, + "sensitivity": 0.8025940347922969 + }, + { + "name": "model.layers.16.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9697613323805854e-05, + "sensitivity": 0.7363442024025337 + }, + { + "name": "model.layers.16.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.463551471824758e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006952823023311794, + "sensitivity": 0.5672486211418577 + }, + { + "name": "model.layers.16.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.38408018858172e-05, + "sensitivity": 0.6606060479067855 + }, + { + "name": "model.layers.16.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.18600972504646e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007339600706472993, + "sensitivity": 0.5559623614159559 + }, + { + "name": "model.layers.16.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.814270116388798e-05, + "sensitivity": 0.6805270400195826 + }, + { + "name": "model.layers.16.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.475040663644904e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006427834159694612, + "sensitivity": 0.5484675777670553 + }, + { + "name": "model.layers.16.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.84356821491383e-05, + "sensitivity": 0.6145359931167024 + }, + { + "name": "model.layers.16.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.211458523670444e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006382351275533438, + "sensitivity": 0.5370975642277902 + }, + { + "name": "model.layers.16.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.940280971117318e-05, + "sensitivity": 0.7462425145519284 + }, + { + "name": "model.layers.16.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.605328053410631e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006665957043878734, + "sensitivity": 0.5283042243086359 + }, + { + "name": "model.layers.16.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.752585275331512e-05, + "sensitivity": 0.7379784692332823 + }, + { + "name": "model.layers.16.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.310942808340769e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006447491468861699, + "sensitivity": 0.5550016903948796 + }, + { + "name": "model.layers.16.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.645742567139678e-05, + "sensitivity": 1.172285555627954 + }, + { + "name": "model.layers.16.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.88688749303401e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7911762269213796e-05, + "sensitivity": 0.6309909780526053 + }, + { + "name": "model.layers.16.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.300717359408736e-05, + "sensitivity": 0.8664109912423372 + }, + { + "name": "model.layers.16.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.887637482577702e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007167315925471485, + "sensitivity": 0.5505814863130034 + }, + { + "name": "model.layers.16.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9461279306560755e-05, + "sensitivity": 0.8615633044385057 + }, + { + "name": "model.layers.16.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.572195386273961e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006708133732900023, + "sensitivity": 0.5144160595317004 + }, + { + "name": "model.layers.16.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1186213669134304e-05, + "sensitivity": 1.3380817644223888 + }, + { + "name": "model.layers.16.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.396262731163006e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.253429455682635e-05, + "sensitivity": 0.6534634755127516 + }, + { + "name": "model.layers.16.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.16069883108139e-05, + "sensitivity": 0.740252352819635 + }, + { + "name": "model.layers.16.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.485831249847251e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000720726209692657, + "sensitivity": 0.5380575499851006 + }, + { + "name": "model.layers.16.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.470935477409512e-05, + "sensitivity": 0.6533798209359893 + }, + { + "name": "model.layers.16.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.829277481301688e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007430700352415442, + "sensitivity": 0.5148189559091219 + }, + { + "name": "model.layers.16.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.958662222838029e-05, + "sensitivity": 1.0275289255908038 + }, + { + "name": "model.layers.16.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.302530550783558e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006989281973801553, + "sensitivity": 0.5293197836080618 + }, + { + "name": "model.layers.16.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.243934330996126e-05, + "sensitivity": 0.8929478861105288 + }, + { + "name": "model.layers.16.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.634471674260567e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007526380941271782, + "sensitivity": 0.5967748440939219 + }, + { + "name": "model.layers.16.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.233464955585077e-05, + "sensitivity": 0.8087718861007984 + }, + { + "name": "model.layers.16.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.27963901883777e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007232515490613878, + "sensitivity": 0.5286389244954715 + }, + { + "name": "model.layers.16.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006920963060110807, + "sensitivity": 0.5512342099738426 + }, + { + "name": "model.layers.16.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.507995635729458e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.34663738310337e-05, + "sensitivity": 0.6064900909221628 + }, + { + "name": "model.layers.16.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.940424671280198e-05, + "sensitivity": 0.9071120025872312 + }, + { + "name": "model.layers.16.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.515417112495925e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006915563717484474, + "sensitivity": 0.5518233297597829 + }, + { + "name": "model.layers.16.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006993203423917294, + "sensitivity": 0.543731819991625 + }, + { + "name": "model.layers.16.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.624755997108878e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007003572536632419, + "sensitivity": 0.5216498852022691 + }, + { + "name": "model.layers.16.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.893694469705224e-05, + "sensitivity": 1.163535719994436 + }, + { + "name": "model.layers.16.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.983559839885856e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006353619392029941, + "sensitivity": 0.5363005239013103 + }, + { + "name": "model.layers.16.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.980298010399565e-05, + "sensitivity": 0.6862804858627635 + }, + { + "name": "model.layers.16.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.854658067823038e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006889039068482816, + "sensitivity": 0.5494394972806245 + }, + { + "name": "model.layers.16.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.916407098993659e-05, + "sensitivity": 0.86314044657983 + }, + { + "name": "model.layers.16.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.821698548264976e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006539043388329446, + "sensitivity": 0.5379688237251222 + }, + { + "name": "model.layers.16.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0370730706199538e-05, + "sensitivity": 1.2308131489237273 + }, + { + "name": "model.layers.16.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.241212642838946e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006290421588346362, + "sensitivity": 0.5582040820541858 + }, + { + "name": "model.layers.16.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.180873606353998e-05, + "sensitivity": 0.6038814559336257 + }, + { + "name": "model.layers.16.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.1667221845928e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007383663905784488, + "sensitivity": 0.5364714927832408 + }, + { + "name": "model.layers.16.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.622814205707982e-05, + "sensitivity": 0.7941584887227643 + }, + { + "name": "model.layers.16.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.910745469212998e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006423332961276174, + "sensitivity": 0.5263160228557003 + }, + { + "name": "model.layers.16.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.965585296507925e-05, + "sensitivity": 1.0211933124618053 + }, + { + "name": "model.layers.16.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.19108675437019e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000695787079166621, + "sensitivity": 0.5304205640076206 + }, + { + "name": "model.layers.16.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.85659799980931e-05, + "sensitivity": 0.8198009253999988 + }, + { + "name": "model.layers.16.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.803263315508957e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006479301955550909, + "sensitivity": 0.5669179715038588 + }, + { + "name": "model.layers.16.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.010620326269418e-05, + "sensitivity": 1.284011090424262 + }, + { + "name": "model.layers.16.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.59567831462482e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006377120735123754, + "sensitivity": 0.573647598485387 + }, + { + "name": "model.layers.16.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0660477528290357e-05, + "sensitivity": 1.3599113478203024 + }, + { + "name": "model.layers.16.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.004345323162852e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.017376290401444e-05, + "sensitivity": 0.6059890860384428 + }, + { + "name": "model.layers.16.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0238740843487903e-05, + "sensitivity": 0.6204496658100933 + }, + { + "name": "model.layers.16.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.369016318785725e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006777895032428205, + "sensitivity": 0.5014591099880235 + }, + { + "name": "model.layers.16.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.2407461983675603e-06, + "sensitivity": 2.096873391205192 + }, + { + "name": "model.layers.16.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.220504928933224e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006529337260872126, + "sensitivity": 0.5163212813682768 + }, + { + "name": "model.layers.16.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3890338525234256e-06, + "sensitivity": 2.097715419328279 + }, + { + "name": "model.layers.16.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.730141528052627e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.0213533641945105e-05, + "sensitivity": 1.52005590177854 + }, + { + "name": "model.layers.16.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0216695045528468e-05, + "sensitivity": 1.5350672538108254 + }, + { + "name": "model.layers.16.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.185695724525431e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006312135374173522, + "sensitivity": 0.53095998603451 + }, + { + "name": "model.layers.16.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.834804586716928e-06, + "sensitivity": 1.5334269603074893 + }, + { + "name": "model.layers.16.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.244143264666491e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006616059690713882, + "sensitivity": 0.5689208304008302 + }, + { + "name": "model.layers.16.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0624817150528543e-05, + "sensitivity": 1.4982229481795808 + }, + { + "name": "model.layers.16.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.692062465343042e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9069057897431776e-05, + "sensitivity": 0.6119276156103577 + }, + { + "name": "model.layers.16.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.164208753034472e-05, + "sensitivity": 0.8475410257202107 + }, + { + "name": "model.layers.16.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.746303142790566e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006919795414432883, + "sensitivity": 0.5205755812746475 + }, + { + "name": "model.layers.16.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 4.747220373246819e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.442612185404869e-06, + "sensitivity": 2.1001073616711112 + }, + { + "name": "model.layers.16.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.374741019499197e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.16.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 7.257636298163561e-06, + "sensitivity": 1.6828009108730246 + }, + { + "name": "model.layers.16.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 2.71807311946759e-05, + "sensitivity": 1.797561079238254 + }, + { + "name": "model.layers.16.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00018194885342381895, + "sensitivity": 1.1874689527676952 + }, + { + "name": "model.layers.16.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.416656141373096e-05, + "sensitivity": 1.8298546480569817 + }, + { + "name": "model.layers.16.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0006541988113895059, + "sensitivity": 0.5777880551599879 + }, + { + "name": "model.layers.16.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002798729983624071, + "sensitivity": 0.790146251878931 + }, + { + "name": "model.layers.17.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.461681212182157e-05, + "sensitivity": 1.151454438043213 + }, + { + "name": "model.layers.17.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.915574992191978e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.100803537061438e-05, + "sensitivity": 0.6356711407159794 + }, + { + "name": "model.layers.17.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.763858644058928e-05, + "sensitivity": 1.174517656863229 + }, + { + "name": "model.layers.17.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.190096423277282e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006631982396356761, + "sensitivity": 0.5995058068510188 + }, + { + "name": "model.layers.17.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.942638381384313e-05, + "sensitivity": 0.7830205244900724 + }, + { + "name": "model.layers.17.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.34068499039131e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000649512221571058, + "sensitivity": 0.5408508486887205 + }, + { + "name": "model.layers.17.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.694153050077148e-06, + "sensitivity": 1.5983556206892835 + }, + { + "name": "model.layers.17.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.686628128387383e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006020100554451346, + "sensitivity": 0.5458063913954572 + }, + { + "name": "model.layers.17.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7007760915439576e-05, + "sensitivity": 0.7337705164741607 + }, + { + "name": "model.layers.17.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.524095397253404e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006283242255449295, + "sensitivity": 0.5857165805012349 + }, + { + "name": "model.layers.17.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0138053767150268e-05, + "sensitivity": 1.9167523058124152 + }, + { + "name": "model.layers.17.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.02690931827965e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006396063836291432, + "sensitivity": 0.5439536042420762 + }, + { + "name": "model.layers.17.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.695772051694803e-05, + "sensitivity": 0.9432880318128534 + }, + { + "name": "model.layers.17.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.699951882183086e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006466718623414636, + "sensitivity": 0.5168436062189641 + }, + { + "name": "model.layers.17.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.427567859645933e-05, + "sensitivity": 0.6621922535336049 + }, + { + "name": "model.layers.17.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.201458060990262e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007266198517754674, + "sensitivity": 0.5931764717354802 + }, + { + "name": "model.layers.17.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000658202450722456, + "sensitivity": 0.5742352138749492 + }, + { + "name": "model.layers.17.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.731917778779462e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006595224840566516, + "sensitivity": 0.5249970578192116 + }, + { + "name": "model.layers.17.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.664453419740312e-05, + "sensitivity": 0.7764982184144552 + }, + { + "name": "model.layers.17.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.434507776655664e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006113043637014925, + "sensitivity": 0.5226617186738426 + }, + { + "name": "model.layers.17.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.879476884729229e-05, + "sensitivity": 0.6170873723547927 + }, + { + "name": "model.layers.17.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.265488536882913e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006203338271006942, + "sensitivity": 0.5675976918542521 + }, + { + "name": "model.layers.17.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9159850934520364e-05, + "sensitivity": 1.026000970023668 + }, + { + "name": "model.layers.17.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.800379873719066e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006389596965163946, + "sensitivity": 0.5482815266911795 + }, + { + "name": "model.layers.17.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.08663831371814e-05, + "sensitivity": 0.6288514674864552 + }, + { + "name": "model.layers.17.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.346105803662795e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006402774015441537, + "sensitivity": 0.5306204714186682 + }, + { + "name": "model.layers.17.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.67998577025719e-05, + "sensitivity": 0.8081746682443737 + }, + { + "name": "model.layers.17.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.009775006532436e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006519716698676348, + "sensitivity": 0.5540296055686726 + }, + { + "name": "model.layers.17.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006623428780585527, + "sensitivity": 0.5547119502242439 + }, + { + "name": "model.layers.17.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.736190354989958e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006428458727896214, + "sensitivity": 0.5615429345929436 + }, + { + "name": "model.layers.17.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.774344754172489e-05, + "sensitivity": 0.7919193025022436 + }, + { + "name": "model.layers.17.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.553038360834762e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006519687594845891, + "sensitivity": 0.5037889168940924 + }, + { + "name": "model.layers.17.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006582130445167422, + "sensitivity": 0.5884579386422247 + }, + { + "name": "model.layers.17.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.47045226287446e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006305359420366585, + "sensitivity": 0.5544184120270401 + }, + { + "name": "model.layers.17.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.441049481509253e-05, + "sensitivity": 0.6376701063898348 + }, + { + "name": "model.layers.17.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.233214430219959e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007164077833294868, + "sensitivity": 0.5338096264520903 + }, + { + "name": "model.layers.17.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.715937732020393e-05, + "sensitivity": 0.9172693707739412 + }, + { + "name": "model.layers.17.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.651352689208579e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005984754534438252, + "sensitivity": 0.5336748171908345 + }, + { + "name": "model.layers.17.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0892067621171009e-05, + "sensitivity": 1.6817516014502076 + }, + { + "name": "model.layers.17.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.447984901569725e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006777711096219718, + "sensitivity": 0.5436274778331136 + }, + { + "name": "model.layers.17.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.710002369596623e-05, + "sensitivity": 0.7194716015062326 + }, + { + "name": "model.layers.17.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.93953586758289e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.636378045892343e-05, + "sensitivity": 0.6153335924527803 + }, + { + "name": "model.layers.17.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.00907915213611e-05, + "sensitivity": 0.620853623199941 + }, + { + "name": "model.layers.17.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.194048864927026e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006885076873004436, + "sensitivity": 0.533382873994215 + }, + { + "name": "model.layers.17.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006961270119063556, + "sensitivity": 0.5666537562609729 + }, + { + "name": "model.layers.17.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.40997086520656e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007009388646110892, + "sensitivity": 0.5703549361073157 + }, + { + "name": "model.layers.17.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3439213236997603e-06, + "sensitivity": 2.0976021677471124 + }, + { + "name": "model.layers.17.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.894067953704507e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 9.732872058521025e-06, + "sensitivity": 1.562903490334871 + }, + { + "name": "model.layers.17.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.834762123413384e-05, + "sensitivity": 0.9080809477354591 + }, + { + "name": "model.layers.17.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.291977570072049e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.672841507475823e-05, + "sensitivity": 0.7877390239504237 + }, + { + "name": "model.layers.17.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.102569750510156e-05, + "sensitivity": 0.6210772502689668 + }, + { + "name": "model.layers.17.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.181667681128602e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006843460141681135, + "sensitivity": 0.5509152805875681 + }, + { + "name": "model.layers.17.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.276821659412235e-05, + "sensitivity": 0.6587780713946526 + }, + { + "name": "model.layers.17.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.800914889026899e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007179062813520432, + "sensitivity": 0.5862407605159811 + }, + { + "name": "model.layers.17.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006611388525925577, + "sensitivity": 0.5252051398160225 + }, + { + "name": "model.layers.17.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.713815992043237e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006474414258264005, + "sensitivity": 0.5050988182100243 + }, + { + "name": "model.layers.17.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.058056897018105e-05, + "sensitivity": 1.177174087162951 + }, + { + "name": "model.layers.17.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.875524150018464e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000650999543722719, + "sensitivity": 0.5251301468706358 + }, + { + "name": "model.layers.17.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0530514373385813e-05, + "sensitivity": 1.5842469916583917 + }, + { + "name": "model.layers.17.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.811603831622051e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7315977755934e-05, + "sensitivity": 0.7436154565957124 + }, + { + "name": "model.layers.17.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.847142165293917e-05, + "sensitivity": 1.101884860574121 + }, + { + "name": "model.layers.17.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.474450735069695e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006436347030103207, + "sensitivity": 0.5322176757689444 + }, + { + "name": "model.layers.17.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.93807635596022e-05, + "sensitivity": 1.0370299242741041 + }, + { + "name": "model.layers.17.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.254906566027785e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006772837368771434, + "sensitivity": 0.5677893643499271 + }, + { + "name": "model.layers.17.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.16779361735098e-05, + "sensitivity": 0.9486640080449331 + }, + { + "name": "model.layers.17.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.372735808530706e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.165822560433298e-05, + "sensitivity": 1.0037833137942231 + }, + { + "name": "model.layers.17.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.760196290793829e-05, + "sensitivity": 0.7893227499325983 + }, + { + "name": "model.layers.17.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.011619007040281e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006356735830195248, + "sensitivity": 0.5258507519853087 + }, + { + "name": "model.layers.17.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.834869443788193e-05, + "sensitivity": 0.6837414910689024 + }, + { + "name": "model.layers.17.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.291817271630862e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006791178020648658, + "sensitivity": 0.5059063290458099 + }, + { + "name": "model.layers.17.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0678835678845644e-05, + "sensitivity": 1.8767796553629852 + }, + { + "name": "model.layers.17.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.930635774755501e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.945742304902524e-05, + "sensitivity": 0.7072075246606853 + }, + { + "name": "model.layers.17.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.784354289062321e-05, + "sensitivity": 0.8751870099338668 + }, + { + "name": "model.layers.17.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.504887437586149e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006269905716180801, + "sensitivity": 0.5295267307291349 + }, + { + "name": "model.layers.17.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.142198981251568e-05, + "sensitivity": 0.7658130700756512 + }, + { + "name": "model.layers.17.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.061089490889572e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006967309745959938, + "sensitivity": 0.5733702117559542 + }, + { + "name": "model.layers.17.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.649836384691298e-05, + "sensitivity": 0.645518020930572 + }, + { + "name": "model.layers.17.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.31742318293982e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006117822485975921, + "sensitivity": 0.5343230827658222 + }, + { + "name": "model.layers.17.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8883637393591926e-05, + "sensitivity": 0.7705049663845809 + }, + { + "name": "model.layers.17.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.639845651079668e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006290716701187193, + "sensitivity": 0.5574654041865902 + }, + { + "name": "model.layers.17.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.342941196635365e-05, + "sensitivity": 0.639438644382427 + }, + { + "name": "model.layers.17.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.797791792858334e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006952762487344444, + "sensitivity": 0.5359232275104066 + }, + { + "name": "model.layers.17.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.054902041796595e-05, + "sensitivity": 1.0202000668575857 + }, + { + "name": "model.layers.17.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.129860364329943e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006589122349396348, + "sensitivity": 0.5478949994605301 + }, + { + "name": "model.layers.17.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000627960660494864, + "sensitivity": 0.5781699387128405 + }, + { + "name": "model.layers.17.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.897440473745519e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006212025764398277, + "sensitivity": 0.541987038918099 + }, + { + "name": "model.layers.17.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.67412753298413e-05, + "sensitivity": 0.9378394397055718 + }, + { + "name": "model.layers.17.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.182655170050566e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006428157212212682, + "sensitivity": 0.5573615511785233 + }, + { + "name": "model.layers.17.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6108878197846934e-05, + "sensitivity": 0.7681429854688511 + }, + { + "name": "model.layers.17.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.215909706952516e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006190197309479117, + "sensitivity": 0.5421675364844715 + }, + { + "name": "model.layers.17.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006322422996163368, + "sensitivity": 0.5825416481090596 + }, + { + "name": "model.layers.17.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.144218443499994e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000608837406616658, + "sensitivity": 0.5627624371573587 + }, + { + "name": "model.layers.17.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.821273953188211e-05, + "sensitivity": 0.7563552375785675 + }, + { + "name": "model.layers.17.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.227694022229116e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006587868556380272, + "sensitivity": 0.5321168255039567 + }, + { + "name": "model.layers.17.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.549153476953506e-05, + "sensitivity": 0.6747816374028743 + }, + { + "name": "model.layers.17.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.498210834455676e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.658980419160798e-05, + "sensitivity": 0.6252292672736375 + }, + { + "name": "model.layers.17.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.245174881769344e-05, + "sensitivity": 0.6949560853123437 + }, + { + "name": "model.layers.17.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.27837345948501e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006979770842008293, + "sensitivity": 0.5594577157493668 + }, + { + "name": "model.layers.17.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.071096140658483e-05, + "sensitivity": 0.7457553190864783 + }, + { + "name": "model.layers.17.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.893008048791671e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006663856329396367, + "sensitivity": 0.545709366578931 + }, + { + "name": "model.layers.17.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.301885878201574e-05, + "sensitivity": 0.923478507635145 + }, + { + "name": "model.layers.17.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.490065172532923e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007025778177194297, + "sensitivity": 0.5621249183523455 + }, + { + "name": "model.layers.17.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.129941175458953e-05, + "sensitivity": 0.8983354546263549 + }, + { + "name": "model.layers.17.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.473069333878811e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006853108061477542, + "sensitivity": 0.5334267560694557 + }, + { + "name": "model.layers.17.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.019386273692362e-05, + "sensitivity": 0.710014859306038 + }, + { + "name": "model.layers.17.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.708743853778287e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006713730981573462, + "sensitivity": 0.5702314604031804 + }, + { + "name": "model.layers.17.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0048500017728657e-05, + "sensitivity": 0.925235090208558 + }, + { + "name": "model.layers.17.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.170561613951577e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006477349670603871, + "sensitivity": 0.5489651717916565 + }, + { + "name": "model.layers.17.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0826550907222554e-05, + "sensitivity": 1.1169045384933298 + }, + { + "name": "model.layers.17.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.425049718927767e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006834546802565455, + "sensitivity": 0.5195055495730968 + }, + { + "name": "model.layers.17.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9187004808336496e-05, + "sensitivity": 0.6806627344155791 + }, + { + "name": "model.layers.17.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.8405438469199e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.882571713300422e-05, + "sensitivity": 0.6556232375451173 + }, + { + "name": "model.layers.17.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0958703569485806e-05, + "sensitivity": 1.9618750655922863 + }, + { + "name": "model.layers.17.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.005975817264698e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.017718624207191e-05, + "sensitivity": 0.6963224927881758 + }, + { + "name": "model.layers.17.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0493822628632188e-05, + "sensitivity": 1.3500542214175666 + }, + { + "name": "model.layers.17.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.978637886983051e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006500994204543531, + "sensitivity": 0.5165258784337132 + }, + { + "name": "model.layers.17.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0245995326840784e-05, + "sensitivity": 1.3864155420644437 + }, + { + "name": "model.layers.17.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.195719374270993e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006033016834408045, + "sensitivity": 0.5876128691364909 + }, + { + "name": "model.layers.17.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.776685429736972e-05, + "sensitivity": 0.7260174543741545 + }, + { + "name": "model.layers.17.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.955030471544887e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006350442999973893, + "sensitivity": 0.5302609053864664 + }, + { + "name": "model.layers.17.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006481326417997479, + "sensitivity": 0.5699507435652847 + }, + { + "name": "model.layers.17.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.010718263700255e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006273322505876422, + "sensitivity": 0.5284880173368678 + }, + { + "name": "model.layers.17.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.475819751969539e-06, + "sensitivity": 1.4701865436142239 + }, + { + "name": "model.layers.17.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.059678637233446e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005914315115660429, + "sensitivity": 0.5495195233348713 + }, + { + "name": "model.layers.17.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0014749932452105e-05, + "sensitivity": 1.2056754242335344 + }, + { + "name": "model.layers.17.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.880374030515668e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005961160641163588, + "sensitivity": 0.5604861225924612 + }, + { + "name": "model.layers.17.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.247349665500224e-05, + "sensitivity": 0.6988311843576372 + }, + { + "name": "model.layers.17.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.048560064504272e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006946692592464387, + "sensitivity": 0.5204266215296154 + }, + { + "name": "model.layers.17.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 4.2312321966164745e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.283136382175144e-06, + "sensitivity": 2.0994290748661903 + }, + { + "name": "model.layers.17.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.502608241338748e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.17.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.6655742456350708e-06, + "sensitivity": 2.104987972588769 + }, + { + "name": "model.layers.17.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 7.748869393253699e-06, + "sensitivity": 2.1908353113184993 + }, + { + "name": "model.layers.17.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00018019579874817282, + "sensitivity": 0.9132328670365855 + }, + { + "name": "model.layers.17.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.564079684612807e-05, + "sensitivity": 1.0788967496537367 + }, + { + "name": "model.layers.17.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.937926107435487e-05, + "sensitivity": 0.657307615601148 + }, + { + "name": "model.layers.17.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002681644109543413, + "sensitivity": 0.6941153772929682 + }, + { + "name": "model.layers.18.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3768755606142804e-05, + "sensitivity": 1.0683910817319835 + }, + { + "name": "model.layers.18.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.720752369597903e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006155906594358385, + "sensitivity": 0.5214875862910846 + }, + { + "name": "model.layers.18.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.718937609344721e-05, + "sensitivity": 0.8210119567374976 + }, + { + "name": "model.layers.18.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.745857490386697e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006240094662643969, + "sensitivity": 0.5435873161001123 + }, + { + "name": "model.layers.18.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.224722892511636e-05, + "sensitivity": 0.7623165971387024 + }, + { + "name": "model.layers.18.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.156503443184192e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007105501717887819, + "sensitivity": 0.5466298288242215 + }, + { + "name": "model.layers.18.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0061551620310638e-05, + "sensitivity": 1.9632300221385734 + }, + { + "name": "model.layers.18.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.652941013067903e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006156706949695945, + "sensitivity": 0.5590213418084131 + }, + { + "name": "model.layers.18.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006565309013240039, + "sensitivity": 0.5813253206507992 + }, + { + "name": "model.layers.18.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.725742309754423e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006417898694053292, + "sensitivity": 0.5401969281153957 + }, + { + "name": "model.layers.18.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.323415436781943e-05, + "sensitivity": 0.9330909836704775 + }, + { + "name": "model.layers.18.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.677225314888346e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007071642903611064, + "sensitivity": 0.5581833857689203 + }, + { + "name": "model.layers.18.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.699681059923023e-05, + "sensitivity": 1.1443021569897265 + }, + { + "name": "model.layers.18.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.25515781393915e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006487325299531221, + "sensitivity": 0.5840361352056971 + }, + { + "name": "model.layers.18.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7568664487916976e-05, + "sensitivity": 0.9337006493647872 + }, + { + "name": "model.layers.18.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.178601665851602e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006650621071457863, + "sensitivity": 0.5563182549170671 + }, + { + "name": "model.layers.18.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006934432312846184, + "sensitivity": 0.5389218499158244 + }, + { + "name": "model.layers.18.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.231537099665729e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000681681209243834, + "sensitivity": 0.5698356111088878 + }, + { + "name": "model.layers.18.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.191273779317271e-06, + "sensitivity": 2.0971314217160186 + }, + { + "name": "model.layers.18.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.8265524078015e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.369901919038966e-05, + "sensitivity": 0.8816863841051026 + }, + { + "name": "model.layers.18.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.147066596895456e-05, + "sensitivity": 0.622258677484572 + }, + { + "name": "model.layers.18.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.287692713158322e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006758943200111389, + "sensitivity": 0.5466854950093959 + }, + { + "name": "model.layers.18.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.696806329069659e-05, + "sensitivity": 0.6067905940874736 + }, + { + "name": "model.layers.18.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.368100452571525e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006174708832986653, + "sensitivity": 0.5780204098313948 + }, + { + "name": "model.layers.18.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.838385550305247e-05, + "sensitivity": 0.6939487178140951 + }, + { + "name": "model.layers.18.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.381583711525309e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006472686072811484, + "sensitivity": 0.5255976296168394 + }, + { + "name": "model.layers.18.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.645816418109462e-05, + "sensitivity": 0.88480288706704 + }, + { + "name": "model.layers.18.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.5531036120301e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006242530071176589, + "sensitivity": 0.5361110409328683 + }, + { + "name": "model.layers.18.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006980095058679581, + "sensitivity": 0.5251848879563237 + }, + { + "name": "model.layers.18.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.535058443863818e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000700572389177978, + "sensitivity": 0.5626738967886133 + }, + { + "name": "model.layers.18.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1446299140516203e-05, + "sensitivity": 1.363656486968438 + }, + { + "name": "model.layers.18.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.483998842872097e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.117915780923795e-05, + "sensitivity": 1.4365983999059246 + }, + { + "name": "model.layers.18.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9938058257102966e-05, + "sensitivity": 0.7584460134545417 + }, + { + "name": "model.layers.18.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.218741527343809e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006461074808612466, + "sensitivity": 0.5545205321885806 + }, + { + "name": "model.layers.18.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.768123082816601e-05, + "sensitivity": 0.7120516206771208 + }, + { + "name": "model.layers.18.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.957709158290527e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006421735743060708, + "sensitivity": 0.5526392376418194 + }, + { + "name": "model.layers.18.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007191387703642249, + "sensitivity": 0.5527646894422348 + }, + { + "name": "model.layers.18.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.733192433079239e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007219755789265037, + "sensitivity": 0.5350909189817061 + }, + { + "name": "model.layers.18.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.093248521210626e-05, + "sensitivity": 0.7774306028741368 + }, + { + "name": "model.layers.18.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.535520924444427e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006799651309847832, + "sensitivity": 0.545475869232167 + }, + { + "name": "model.layers.18.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.816043267259374e-05, + "sensitivity": 1.1710794510465827 + }, + { + "name": "model.layers.18.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.433490054609138e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006353770149871707, + "sensitivity": 0.5431730878568697 + }, + { + "name": "model.layers.18.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0106734407600015e-05, + "sensitivity": 1.6832395978520736 + }, + { + "name": "model.layers.18.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.611265798208478e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.489853720064275e-05, + "sensitivity": 0.9629650798706694 + }, + { + "name": "model.layers.18.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006627370603382587, + "sensitivity": 0.5768224645609046 + }, + { + "name": "model.layers.18.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.270374797168188e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006388802430592477, + "sensitivity": 0.5486702356002139 + }, + { + "name": "model.layers.18.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.68132491025608e-05, + "sensitivity": 0.6102596762798426 + }, + { + "name": "model.layers.18.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.751148925512098e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006150329136289656, + "sensitivity": 0.5135808253744026 + }, + { + "name": "model.layers.18.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.125067011453211e-05, + "sensitivity": 1.0584423972168922 + }, + { + "name": "model.layers.18.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.17971988201316e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006934773991815746, + "sensitivity": 0.5352620268877318 + }, + { + "name": "model.layers.18.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.424254388548434e-05, + "sensitivity": 0.7771946257072306 + }, + { + "name": "model.layers.18.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.239402179948229e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007157858344726264, + "sensitivity": 0.5463998723360118 + }, + { + "name": "model.layers.18.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.234878674149513e-05, + "sensitivity": 0.9960398248431956 + }, + { + "name": "model.layers.18.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.754192665743176e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.146671512397006e-05, + "sensitivity": 0.6016391237800286 + }, + { + "name": "model.layers.18.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.030965596437454e-05, + "sensitivity": 0.9749665585819647 + }, + { + "name": "model.layers.18.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.50480865008285e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006809992482885718, + "sensitivity": 0.537252745106604 + }, + { + "name": "model.layers.18.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0353046137606725e-05, + "sensitivity": 1.135109142448228 + }, + { + "name": "model.layers.18.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.852235626160109e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006965158390812576, + "sensitivity": 0.5591972827921904 + }, + { + "name": "model.layers.18.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0989504517056048e-05, + "sensitivity": 1.2584627837293307 + }, + { + "name": "model.layers.18.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.290878324463847e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006513729458674788, + "sensitivity": 0.5447699725165202 + }, + { + "name": "model.layers.18.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.773509474238381e-05, + "sensitivity": 1.0510728013324637 + }, + { + "name": "model.layers.18.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.106434847832134e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006292964098975062, + "sensitivity": 0.5731517845213719 + }, + { + "name": "model.layers.18.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.718658212572336e-05, + "sensitivity": 0.8609747065272525 + }, + { + "name": "model.layers.18.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.406209761029459e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006257520872168243, + "sensitivity": 0.5862614305788391 + }, + { + "name": "model.layers.18.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.828587381984107e-05, + "sensitivity": 0.9519449352946373 + }, + { + "name": "model.layers.18.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.572740858246107e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00065939238993451, + "sensitivity": 0.5158423532486368 + }, + { + "name": "model.layers.18.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.609971049125306e-05, + "sensitivity": 0.8167990984267717 + }, + { + "name": "model.layers.18.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.20007414858992e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.509125185199082e-05, + "sensitivity": 0.7376413067146534 + }, + { + "name": "model.layers.18.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.940775736235082e-05, + "sensitivity": 0.8513860615820007 + }, + { + "name": "model.layers.18.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.860672551236348e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006573688006028533, + "sensitivity": 0.5500838737252949 + }, + { + "name": "model.layers.18.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.711413541575894e-05, + "sensitivity": 0.6928415657598016 + }, + { + "name": "model.layers.18.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.577610633939912e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006261933594942093, + "sensitivity": 0.5304496897894063 + }, + { + "name": "model.layers.18.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9911013522651047e-05, + "sensitivity": 0.9685396768412287 + }, + { + "name": "model.layers.18.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.591014312107291e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.054558252799325e-05, + "sensitivity": 0.7148080689063118 + }, + { + "name": "model.layers.18.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.290683010476641e-06, + "sensitivity": 1.4577627528632568 + }, + { + "name": "model.layers.18.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.395439757194254e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005845701089128852, + "sensitivity": 0.5648250793369446 + }, + { + "name": "model.layers.18.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.043287430657074e-05, + "sensitivity": 0.6412887838143002 + }, + { + "name": "model.layers.18.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.660185363216442e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006697532953694463, + "sensitivity": 0.5635214183676419 + }, + { + "name": "model.layers.18.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.571487756446004e-05, + "sensitivity": 0.7445277258687123 + }, + { + "name": "model.layers.18.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.585402161363163e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007525449618697166, + "sensitivity": 0.5265433985258016 + }, + { + "name": "model.layers.18.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.909112223889679e-05, + "sensitivity": 0.7901876704240491 + }, + { + "name": "model.layers.18.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.169098239501182e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006509320810437202, + "sensitivity": 0.5543123333190413 + }, + { + "name": "model.layers.18.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.894695641472936e-05, + "sensitivity": 0.96917918038664 + }, + { + "name": "model.layers.18.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.588190331058286e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006539045716635883, + "sensitivity": 0.5825980260566714 + }, + { + "name": "model.layers.18.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0869334801100194e-05, + "sensitivity": 1.2393846095289944 + }, + { + "name": "model.layers.18.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.01183887233492e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8889530919259414e-05, + "sensitivity": 0.6121964562604877 + }, + { + "name": "model.layers.18.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.468895298894495e-05, + "sensitivity": 0.6128540419506227 + }, + { + "name": "model.layers.18.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.528240075771464e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.478426803369075e-05, + "sensitivity": 0.6048557244950232 + }, + { + "name": "model.layers.18.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8650370192481205e-05, + "sensitivity": 0.6247889750291721 + }, + { + "name": "model.layers.18.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.643853680543543e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006457070121541619, + "sensitivity": 0.5417162388419479 + }, + { + "name": "model.layers.18.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6873905123211443e-05, + "sensitivity": 0.6064556502180046 + }, + { + "name": "model.layers.18.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.506510198458272e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006157317548058927, + "sensitivity": 0.540864845723175 + }, + { + "name": "model.layers.18.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1194555554538965e-05, + "sensitivity": 1.4448165309156729 + }, + { + "name": "model.layers.18.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.862867844072753e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.16025718045421e-05, + "sensitivity": 0.6007817280836287 + }, + { + "name": "model.layers.18.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0741776350187138e-05, + "sensitivity": 1.31863642277804 + }, + { + "name": "model.layers.18.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.825353011663537e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.077845081454143e-05, + "sensitivity": 1.3873834400804583 + }, + { + "name": "model.layers.18.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.586366751231253e-05, + "sensitivity": 1.0963588271794014 + }, + { + "name": "model.layers.18.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.272034056564735e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006295155035331845, + "sensitivity": 0.5594815997505217 + }, + { + "name": "model.layers.18.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.197067811328452e-06, + "sensitivity": 1.992892443254145 + }, + { + "name": "model.layers.18.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.621894842988695e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.028600571677089e-05, + "sensitivity": 0.6490427340392377 + }, + { + "name": "model.layers.18.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006872533122077584, + "sensitivity": 0.5491348209456268 + }, + { + "name": "model.layers.18.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.136735919426428e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006915683625265956, + "sensitivity": 0.5199439361852398 + }, + { + "name": "model.layers.18.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0277489309373777e-05, + "sensitivity": 1.8889414671389742 + }, + { + "name": "model.layers.18.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.731064440326008e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.530676571652293e-05, + "sensitivity": 0.727865579312458 + }, + { + "name": "model.layers.18.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.344218854792416e-05, + "sensitivity": 0.9913448328897938 + }, + { + "name": "model.layers.18.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.570662662852556e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007164551643654704, + "sensitivity": 0.5579995212603616 + }, + { + "name": "model.layers.18.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0033345461124554e-05, + "sensitivity": 1.3454417738520528 + }, + { + "name": "model.layers.18.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.598412258223107e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006325780414044857, + "sensitivity": 0.572077799423882 + }, + { + "name": "model.layers.18.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006393682560883462, + "sensitivity": 0.5628403439788878 + }, + { + "name": "model.layers.18.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0273363386659184e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006133638671599329, + "sensitivity": 0.5262693254632584 + }, + { + "name": "model.layers.18.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.090050136554055e-05, + "sensitivity": 1.4282971426629516 + }, + { + "name": "model.layers.18.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.286257641681004e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0455869970610365e-05, + "sensitivity": 0.76831631769947 + }, + { + "name": "model.layers.18.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.041878805262968e-05, + "sensitivity": 0.7840448570198159 + }, + { + "name": "model.layers.18.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.915379344718531e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006594274891540408, + "sensitivity": 0.5622263718441824 + }, + { + "name": "model.layers.18.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.720616536564194e-05, + "sensitivity": 0.8860686427366288 + }, + { + "name": "model.layers.18.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.56255451758625e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006297365762293339, + "sensitivity": 0.5238387137732312 + }, + { + "name": "model.layers.18.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.972495273454115e-05, + "sensitivity": 0.6619986584914582 + }, + { + "name": "model.layers.18.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.812341553086299e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006689619622193277, + "sensitivity": 0.5740431880616034 + }, + { + "name": "model.layers.18.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.004161822493188e-05, + "sensitivity": 1.6872062508261338 + }, + { + "name": "model.layers.18.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0078637160404469e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5902964959386736e-05, + "sensitivity": 0.8143149044527186 + }, + { + "name": "model.layers.18.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8473480748943985e-05, + "sensitivity": 0.8741074547308023 + }, + { + "name": "model.layers.18.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.632043323406833e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006402199505828321, + "sensitivity": 0.5236312940989641 + }, + { + "name": "model.layers.18.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000685560517013073, + "sensitivity": 0.5448568300953934 + }, + { + "name": "model.layers.18.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.878816520838882e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006672485615126789, + "sensitivity": 0.5609565789796327 + }, + { + "name": "model.layers.18.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.734939986723475e-05, + "sensitivity": 1.1768944530365477 + }, + { + "name": "model.layers.18.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.826556955275009e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.797428821097128e-05, + "sensitivity": 0.9542206857208423 + }, + { + "name": "model.layers.18.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006780046387575567, + "sensitivity": 0.5419885667435584 + }, + { + "name": "model.layers.18.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.192631190060638e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006906039780005813, + "sensitivity": 0.5287099810273603 + }, + { + "name": "model.layers.18.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 4.257918590155896e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.351557668589521e-06, + "sensitivity": 2.1001130731669697 + }, + { + "name": "model.layers.18.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.562369208040764e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.18.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.763187128744903e-06, + "sensitivity": 2.1043345314663116 + }, + { + "name": "model.layers.18.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 2.7376900106901303e-05, + "sensitivity": 1.748111329280677 + }, + { + "name": "model.layers.18.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00018819123215507716, + "sensitivity": 0.939685310589093 + }, + { + "name": "model.layers.18.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.4522366655000951e-05, + "sensitivity": 1.4164708630351979 + }, + { + "name": "model.layers.18.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 6.193553417688236e-05, + "sensitivity": 0.8128216660411776 + }, + { + "name": "model.layers.18.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00026967673329636455, + "sensitivity": 0.8376330955839231 + }, + { + "name": "model.layers.19.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.876152863493189e-05, + "sensitivity": 0.9368657139138483 + }, + { + "name": "model.layers.19.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.310688374673191e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006349773029796779, + "sensitivity": 0.5270105783285124 + }, + { + "name": "model.layers.19.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.259953806875274e-05, + "sensitivity": 0.8309648218957209 + }, + { + "name": "model.layers.19.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.041017167670361e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000707445084117353, + "sensitivity": 0.5697585547036377 + }, + { + "name": "model.layers.19.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1552239811862819e-05, + "sensitivity": 1.9940469018311662 + }, + { + "name": "model.layers.19.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.059434435381263e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007168753072619438, + "sensitivity": 0.5855177099166555 + }, + { + "name": "model.layers.19.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.877359944861382e-05, + "sensitivity": 0.8317974205649971 + }, + { + "name": "model.layers.19.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.268306833590032e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006605886737816036, + "sensitivity": 0.5294591891768197 + }, + { + "name": "model.layers.19.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.942988718743436e-05, + "sensitivity": 0.7317001785306171 + }, + { + "name": "model.layers.19.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.702496986894403e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006537871668115258, + "sensitivity": 0.5614494155288321 + }, + { + "name": "model.layers.19.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7493285567034036e-05, + "sensitivity": 0.74912740993433 + }, + { + "name": "model.layers.19.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.849329222153756e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006556273438036442, + "sensitivity": 0.5169610193034113 + }, + { + "name": "model.layers.19.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.11172872595489e-05, + "sensitivity": 1.0240929741990898 + }, + { + "name": "model.layers.19.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.864110559945402e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007101434166543186, + "sensitivity": 0.5668135204597028 + }, + { + "name": "model.layers.19.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0779192962218076e-05, + "sensitivity": 1.3815098479254246 + }, + { + "name": "model.layers.19.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.660407052549999e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000644977088086307, + "sensitivity": 0.5246232033408615 + }, + { + "name": "model.layers.19.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.016890984028578e-05, + "sensitivity": 0.8749706893868465 + }, + { + "name": "model.layers.19.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.213451469084248e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006543492199853063, + "sensitivity": 0.5464301223789266 + }, + { + "name": "model.layers.19.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1416795132390689e-05, + "sensitivity": 1.3399636240782893 + }, + { + "name": "model.layers.19.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.445188430210692e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007023645448498428, + "sensitivity": 0.5562947351959591 + }, + { + "name": "model.layers.19.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.57997588859871e-05, + "sensitivity": 0.7067773016060271 + }, + { + "name": "model.layers.19.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.104636322059378e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007509188144467771, + "sensitivity": 0.5439033586991099 + }, + { + "name": "model.layers.19.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9385925851529464e-05, + "sensitivity": 0.8603636076457223 + }, + { + "name": "model.layers.19.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.483292054326739e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006425100727938116, + "sensitivity": 0.5483396439029959 + }, + { + "name": "model.layers.19.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.850428715348244e-05, + "sensitivity": 0.917049505608442 + }, + { + "name": "model.layers.19.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.43550196805154e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006576854502782226, + "sensitivity": 0.5353209026079859 + }, + { + "name": "model.layers.19.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9805977798532695e-05, + "sensitivity": 0.7073645233342587 + }, + { + "name": "model.layers.19.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.104859266997664e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006434014067053795, + "sensitivity": 0.5136237217934313 + }, + { + "name": "model.layers.19.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.790881550638005e-05, + "sensitivity": 0.6746842164845195 + }, + { + "name": "model.layers.19.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.669226190249901e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006430658977478743, + "sensitivity": 0.5316611349241777 + }, + { + "name": "model.layers.19.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1670016647258308e-05, + "sensitivity": 1.4198787003951607 + }, + { + "name": "model.layers.19.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.171982699423097e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9268564655212685e-05, + "sensitivity": 1.1612546878941197 + }, + { + "name": "model.layers.19.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.410056084860116e-05, + "sensitivity": 1.1977430586384112 + }, + { + "name": "model.layers.19.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.534887688758317e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.193156877998263e-05, + "sensitivity": 0.6426313137038404 + }, + { + "name": "model.layers.19.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0938560990325641e-05, + "sensitivity": 1.5229179097209378 + }, + { + "name": "model.layers.19.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.414420568034984e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006432022200897336, + "sensitivity": 0.5540096741732735 + }, + { + "name": "model.layers.19.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1358623851265293e-05, + "sensitivity": 1.3514023818537826 + }, + { + "name": "model.layers.19.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.265703061420936e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.020099681336433e-05, + "sensitivity": 0.6881783824875676 + }, + { + "name": "model.layers.19.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9370500821387395e-05, + "sensitivity": 1.000517065076244 + }, + { + "name": "model.layers.19.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.684481827003765e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7954057410825044e-05, + "sensitivity": 0.7661674736962873 + }, + { + "name": "model.layers.19.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.829852307215333e-05, + "sensitivity": 0.7800568850120693 + }, + { + "name": "model.layers.19.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.891523642276297e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006413793889805675, + "sensitivity": 0.5273246737813941 + }, + { + "name": "model.layers.19.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.03534748632228e-05, + "sensitivity": 1.237982908836851 + }, + { + "name": "model.layers.19.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.749897127316217e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006312556797638535, + "sensitivity": 0.5214923819024371 + }, + { + "name": "model.layers.19.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9394555137259886e-05, + "sensitivity": 0.6022237444304146 + }, + { + "name": "model.layers.19.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.282489491444721e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000661953235976398, + "sensitivity": 0.5213066511546013 + }, + { + "name": "model.layers.19.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0869973822264e-05, + "sensitivity": 0.965217678933039 + }, + { + "name": "model.layers.19.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.181866183396778e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.991503348923288e-05, + "sensitivity": 0.7317969912218751 + }, + { + "name": "model.layers.19.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0501854022732005e-05, + "sensitivity": 0.6333966674190391 + }, + { + "name": "model.layers.19.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.728493756076205e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006635775207541883, + "sensitivity": 0.5422034039721404 + }, + { + "name": "model.layers.19.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1186511073901784e-05, + "sensitivity": 1.5852904173513238 + }, + { + "name": "model.layers.19.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.229607490444323e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006725361454300582, + "sensitivity": 0.5521411792781745 + }, + { + "name": "model.layers.19.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0126621974632144e-05, + "sensitivity": 0.7493393007724858 + }, + { + "name": "model.layers.19.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.61504770960164e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006824489100836217, + "sensitivity": 0.5163088920234953 + }, + { + "name": "model.layers.19.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006555861327797174, + "sensitivity": 0.5185057049699867 + }, + { + "name": "model.layers.19.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.237295219259977e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006527978694066405, + "sensitivity": 0.5649147913536021 + }, + { + "name": "model.layers.19.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.648800187278539e-06, + "sensitivity": 1.5248140186814423 + }, + { + "name": "model.layers.19.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.416620751930168e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.0684320740401745e-05, + "sensitivity": 1.1521271074738644 + }, + { + "name": "model.layers.19.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.046374200086575e-05, + "sensitivity": 1.2983556341420088 + }, + { + "name": "model.layers.19.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.616221751050034e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006142151542007923, + "sensitivity": 0.532298515853381 + }, + { + "name": "model.layers.19.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1996706234640442e-05, + "sensitivity": 1.409989136042963 + }, + { + "name": "model.layers.19.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.979807949392125e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000729390827473253, + "sensitivity": 0.5574213863237296 + }, + { + "name": "model.layers.19.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7058838137891144e-05, + "sensitivity": 1.0910861709878656 + }, + { + "name": "model.layers.19.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.890665531500417e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006176017923280597, + "sensitivity": 0.543391802687166 + }, + { + "name": "model.layers.19.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.495629011420533e-05, + "sensitivity": 0.9440054367767609 + }, + { + "name": "model.layers.19.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.688152100447041e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006264374824240804, + "sensitivity": 0.5060698892120897 + }, + { + "name": "model.layers.19.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.08495574851986e-05, + "sensitivity": 0.865017073203918 + }, + { + "name": "model.layers.19.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.289267275860766e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9303354646544904e-05, + "sensitivity": 0.61350072645335 + }, + { + "name": "model.layers.19.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.007466436130926e-05, + "sensitivity": 0.7315432443963399 + }, + { + "name": "model.layers.19.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.146688290049497e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006752772023901343, + "sensitivity": 0.5580532278967869 + }, + { + "name": "model.layers.19.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.98758969217306e-06, + "sensitivity": 1.7948311737252942 + }, + { + "name": "model.layers.19.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.500371109221305e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.4121570428833365e-05, + "sensitivity": 0.806940336370173 + }, + { + "name": "model.layers.19.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.898196104681119e-05, + "sensitivity": 1.0253559648879715 + }, + { + "name": "model.layers.19.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.180082093327655e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006347540183924139, + "sensitivity": 0.5678225359521688 + }, + { + "name": "model.layers.19.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.86785827181302e-05, + "sensitivity": 0.7884680195882199 + }, + { + "name": "model.layers.19.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.320281494889059e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006497708964161575, + "sensitivity": 0.5132727013943641 + }, + { + "name": "model.layers.19.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0107657191110775e-05, + "sensitivity": 0.9028489549481789 + }, + { + "name": "model.layers.19.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.533018108711985e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006651212461292744, + "sensitivity": 0.5272881597419466 + }, + { + "name": "model.layers.19.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.000467692501843e-05, + "sensitivity": 0.7962600343848137 + }, + { + "name": "model.layers.19.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.978726562716474e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006556756561622024, + "sensitivity": 0.528546177834924 + }, + { + "name": "model.layers.19.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.531976396217942e-05, + "sensitivity": 0.7945056822522613 + }, + { + "name": "model.layers.19.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.429080142173916e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007344274781644344, + "sensitivity": 0.5998834423806344 + }, + { + "name": "model.layers.19.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0258127632550895e-05, + "sensitivity": 1.0351481610543374 + }, + { + "name": "model.layers.19.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.659463676645828e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0643091273959726e-05, + "sensitivity": 0.6642043776674201 + }, + { + "name": "model.layers.19.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.287489668466151e-05, + "sensitivity": 0.7697996550016973 + }, + { + "name": "model.layers.19.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.583856813653256e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007254955125972629, + "sensitivity": 0.5336876911035394 + }, + { + "name": "model.layers.19.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.844206942943856e-06, + "sensitivity": 1.2026372358492396 + }, + { + "name": "model.layers.19.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1747588359867223e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 9.470925760979299e-06, + "sensitivity": 1.2443409414190048 + }, + { + "name": "model.layers.19.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0849811587831937e-05, + "sensitivity": 1.372281356271063 + }, + { + "name": "model.layers.19.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.605294965491339e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.829457950312644e-05, + "sensitivity": 0.8463575006522699 + }, + { + "name": "model.layers.19.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.615096208406612e-05, + "sensitivity": 0.6683099975122065 + }, + { + "name": "model.layers.19.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.04539615981048e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007404100033454597, + "sensitivity": 0.5775761645867791 + }, + { + "name": "model.layers.19.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9947829868178815e-05, + "sensitivity": 0.833319800020328 + }, + { + "name": "model.layers.19.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.96244443993055e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6680852139834315e-05, + "sensitivity": 0.6161824330517606 + }, + { + "name": "model.layers.19.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2359560059849173e-05, + "sensitivity": 1.6926097357846164 + }, + { + "name": "model.layers.19.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.683429430471733e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.319249223452061e-05, + "sensitivity": 1.0520214437640174 + }, + { + "name": "model.layers.19.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0833906344487332e-05, + "sensitivity": 1.2135509357842302 + }, + { + "name": "model.layers.19.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.809052249285742e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006605993257835507, + "sensitivity": 0.5455926154489663 + }, + { + "name": "model.layers.19.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.747075192630291e-05, + "sensitivity": 0.7130982560577908 + }, + { + "name": "model.layers.19.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.498507332253212e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000653569120913744, + "sensitivity": 0.548043846657554 + }, + { + "name": "model.layers.19.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6294411479029804e-05, + "sensitivity": 0.9590650951367612 + }, + { + "name": "model.layers.19.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.248493597624474e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.4627111239824444e-05, + "sensitivity": 0.6513163519566365 + }, + { + "name": "model.layers.19.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.134665944846347e-05, + "sensitivity": 1.3315920161631412 + }, + { + "name": "model.layers.19.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.053348796631326e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007221802952699363, + "sensitivity": 0.5895840052086339 + }, + { + "name": "model.layers.19.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.741901622968726e-05, + "sensitivity": 0.7645136066760989 + }, + { + "name": "model.layers.19.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.351462383870967e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006328622112050653, + "sensitivity": 0.5461907344128292 + }, + { + "name": "model.layers.19.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.404653347795829e-05, + "sensitivity": 1.179558587592771 + }, + { + "name": "model.layers.19.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.664168831273855e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.427856740425341e-05, + "sensitivity": 0.6141391982924809 + }, + { + "name": "model.layers.19.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7651424867799506e-05, + "sensitivity": 0.7277730013884077 + }, + { + "name": "model.layers.19.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0248520538880257e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006189779378473759, + "sensitivity": 0.5697858442907295 + }, + { + "name": "model.layers.19.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0931367796729319e-05, + "sensitivity": 1.4032921112624044 + }, + { + "name": "model.layers.19.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.094611535445438e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000666033651214093, + "sensitivity": 0.5420334555032834 + }, + { + "name": "model.layers.19.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.884556958335452e-05, + "sensitivity": 1.0708581382907387 + }, + { + "name": "model.layers.19.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.483180072791583e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006568226963281631, + "sensitivity": 0.536442410387929 + }, + { + "name": "model.layers.19.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.833373870700598e-05, + "sensitivity": 1.015433603172787 + }, + { + "name": "model.layers.19.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.138424737400783e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006581383058801293, + "sensitivity": 0.5304815211887368 + }, + { + "name": "model.layers.19.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0427773860283196e-05, + "sensitivity": 0.9364708316005375 + }, + { + "name": "model.layers.19.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.87486021888617e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006520829047076404, + "sensitivity": 0.5654456146318855 + }, + { + "name": "model.layers.19.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.1925652617937885e-06, + "sensitivity": 2.0972786766816274 + }, + { + "name": "model.layers.19.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.89389355052117e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.375222099246457e-05, + "sensitivity": 0.6475168023822913 + }, + { + "name": "model.layers.19.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8241388614987954e-05, + "sensitivity": 1.0682038408475387 + }, + { + "name": "model.layers.19.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.678812158294022e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006347006419673562, + "sensitivity": 0.5723633529378053 + }, + { + "name": "model.layers.19.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.98369151703082e-05, + "sensitivity": 0.6645464671032554 + }, + { + "name": "model.layers.19.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.031452125578653e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006706027197651565, + "sensitivity": 0.5517007175599339 + }, + { + "name": "model.layers.19.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006556607550010085, + "sensitivity": 0.5512331352882991 + }, + { + "name": "model.layers.19.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.89728870181716e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006292978650890291, + "sensitivity": 0.525099748941682 + }, + { + "name": "model.layers.19.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.029702126397751e-05, + "sensitivity": 0.9656435215990208 + }, + { + "name": "model.layers.19.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.664469651695981e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006722956895828247, + "sensitivity": 0.557957691165478 + }, + { + "name": "model.layers.19.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 4.0031973185250536e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3383036023005843e-06, + "sensitivity": 2.099834170023734 + }, + { + "name": "model.layers.19.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.417579925255268e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.19.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 7.790118615957908e-06, + "sensitivity": 1.386085282875864 + }, + { + "name": "model.layers.19.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 3.192814256181009e-05, + "sensitivity": 1.9421012090134682 + }, + { + "name": "model.layers.19.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00018077378626912832, + "sensitivity": 1.0690458319870662 + }, + { + "name": "model.layers.19.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.643800896999892e-05, + "sensitivity": 1.258131320190985 + }, + { + "name": "model.layers.19.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0006832742947153747, + "sensitivity": 0.5504496310558208 + }, + { + "name": "model.layers.19.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002673773851711303, + "sensitivity": 0.7335318994903526 + }, + { + "name": "model.layers.20.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.961624265182763e-05, + "sensitivity": 1.1916419808917444 + }, + { + "name": "model.layers.20.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.023475288609916e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000653678725939244, + "sensitivity": 0.5454899039390482 + }, + { + "name": "model.layers.20.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007260659476742148, + "sensitivity": 0.558578567938649 + }, + { + "name": "model.layers.20.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.65069535443763e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006928014336153865, + "sensitivity": 0.5619652476146978 + }, + { + "name": "model.layers.20.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.731965939048678e-05, + "sensitivity": 0.8083513440873115 + }, + { + "name": "model.layers.20.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.098125027165224e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006385261658579111, + "sensitivity": 0.5155225274504436 + }, + { + "name": "model.layers.20.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.111292168498039e-05, + "sensitivity": 0.7800007594133374 + }, + { + "name": "model.layers.20.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0853761978069087e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006966580986045301, + "sensitivity": 0.5938431191585292 + }, + { + "name": "model.layers.20.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.28968991804868e-05, + "sensitivity": 1.094395647017167 + }, + { + "name": "model.layers.20.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.894449254308711e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006917395512573421, + "sensitivity": 0.5802581662989211 + }, + { + "name": "model.layers.20.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.997137850499712e-05, + "sensitivity": 0.8147287335770342 + }, + { + "name": "model.layers.20.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.072899623177364e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006632154108956456, + "sensitivity": 0.5266012694026626 + }, + { + "name": "model.layers.20.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.024046888342127e-05, + "sensitivity": 0.621071143835717 + }, + { + "name": "model.layers.20.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.984358833506121e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006495471461676061, + "sensitivity": 0.5454412458445417 + }, + { + "name": "model.layers.20.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1901624020538293e-05, + "sensitivity": 1.2660654527481943 + }, + { + "name": "model.layers.20.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.73505405504693e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007166418945416808, + "sensitivity": 0.5473248265596455 + }, + { + "name": "model.layers.20.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.896115180803463e-05, + "sensitivity": 0.9732723633923882 + }, + { + "name": "model.layers.20.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.084046723728534e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006447415798902512, + "sensitivity": 0.5699147117777952 + }, + { + "name": "model.layers.20.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.380700506269932e-05, + "sensitivity": 0.7754000973915249 + }, + { + "name": "model.layers.20.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.505779310828075e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007014956208877265, + "sensitivity": 0.5447520914846815 + }, + { + "name": "model.layers.20.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1279113095952198e-05, + "sensitivity": 1.3353169363381971 + }, + { + "name": "model.layers.20.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.66623247222742e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00068761280272156, + "sensitivity": 0.5587166741328682 + }, + { + "name": "model.layers.20.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1129122867714614e-05, + "sensitivity": 1.362740400456367 + }, + { + "name": "model.layers.20.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.079289960325696e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006673883181065321, + "sensitivity": 0.5735166742662103 + }, + { + "name": "model.layers.20.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0410891263745725e-05, + "sensitivity": 1.572998315131814 + }, + { + "name": "model.layers.20.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.779949105999549e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006365698645822704, + "sensitivity": 0.5785869438462765 + }, + { + "name": "model.layers.20.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.821452214149758e-05, + "sensitivity": 0.7819496616151946 + }, + { + "name": "model.layers.20.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.246266816058778e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.634051558445208e-05, + "sensitivity": 0.6834350239893332 + }, + { + "name": "model.layers.20.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.642544056172483e-05, + "sensitivity": 1.1578293132151791 + }, + { + "name": "model.layers.20.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.620047431875719e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.466632865136489e-05, + "sensitivity": 0.9142775563345338 + }, + { + "name": "model.layers.20.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.207567639648914e-05, + "sensitivity": 1.0139544612624622 + }, + { + "name": "model.layers.20.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.489703991974238e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007027639076113701, + "sensitivity": 0.5763819346659312 + }, + { + "name": "model.layers.20.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.33366871625185e-05, + "sensitivity": 0.7636777835754364 + }, + { + "name": "model.layers.20.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.137062081914337e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007067638216540217, + "sensitivity": 0.560823282249965 + }, + { + "name": "model.layers.20.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.233137537492439e-05, + "sensitivity": 1.127482327769577 + }, + { + "name": "model.layers.20.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.131464260761277e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000672479160130024, + "sensitivity": 0.563138616987967 + }, + { + "name": "model.layers.20.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.2768135750084184e-06, + "sensitivity": 2.0112249942968745 + }, + { + "name": "model.layers.20.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.651580406469293e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.230555689195171e-05, + "sensitivity": 0.9631153478214038 + }, + { + "name": "model.layers.20.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0674742043192964e-05, + "sensitivity": 1.2206043971814293 + }, + { + "name": "model.layers.20.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.995870537844894e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006441769655793905, + "sensitivity": 0.5460091414469681 + }, + { + "name": "model.layers.20.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.538719753734767e-05, + "sensitivity": 1.053729067020045 + }, + { + "name": "model.layers.20.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.265975341397279e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.419725104933605e-05, + "sensitivity": 0.614372991475755 + }, + { + "name": "model.layers.20.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.959677218925208e-05, + "sensitivity": 1.027089020236314 + }, + { + "name": "model.layers.20.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.246784884453518e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006592316785827279, + "sensitivity": 0.5521797051275956 + }, + { + "name": "model.layers.20.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.308910087682307e-05, + "sensitivity": 0.9248132098272854 + }, + { + "name": "model.layers.20.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.302560334210284e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.142591882962734e-05, + "sensitivity": 0.637414335902284 + }, + { + "name": "model.layers.20.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1367227671144065e-05, + "sensitivity": 1.8346651201542072 + }, + { + "name": "model.layers.20.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.400272122344177e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.208679405972362e-05, + "sensitivity": 0.6651005247440128 + }, + { + "name": "model.layers.20.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.102721034840215e-05, + "sensitivity": 1.5244497404667137 + }, + { + "name": "model.layers.20.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.961745384614915e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9643934946507215e-05, + "sensitivity": 0.695110920857563 + }, + { + "name": "model.layers.20.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1616614756349009e-05, + "sensitivity": 1.390316483217166 + }, + { + "name": "model.layers.20.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.207851240309537e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006977186421863735, + "sensitivity": 0.5334477169753207 + }, + { + "name": "model.layers.20.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.207222759258002e-05, + "sensitivity": 0.8834528181524062 + }, + { + "name": "model.layers.20.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.692844974371837e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006551377009600401, + "sensitivity": 0.5788208403768159 + }, + { + "name": "model.layers.20.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1329204426147044e-05, + "sensitivity": 1.2888320183054887 + }, + { + "name": "model.layers.20.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.889672583085485e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.1504132999107242e-05, + "sensitivity": 1.5431553725436902 + }, + { + "name": "model.layers.20.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.740686901845038e-05, + "sensitivity": 1.1837355224122694 + }, + { + "name": "model.layers.20.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.184998824210197e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6090513680828735e-05, + "sensitivity": 0.6873437541620037 + }, + { + "name": "model.layers.20.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.046454235620331e-05, + "sensitivity": 1.6128239070207657 + }, + { + "name": "model.layers.20.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.744840336774359e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5701144447084516e-05, + "sensitivity": 0.6123968877190555 + }, + { + "name": "model.layers.20.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0920501154032536e-05, + "sensitivity": 1.620761244475798 + }, + { + "name": "model.layers.20.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.075031251384644e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006550023099407554, + "sensitivity": 0.5649350499684704 + }, + { + "name": "model.layers.20.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.172854773467407e-05, + "sensitivity": 1.1586999967765297 + }, + { + "name": "model.layers.20.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.649045983271208e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006698516081087291, + "sensitivity": 0.5922356645552063 + }, + { + "name": "model.layers.20.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.19320198893547e-05, + "sensitivity": 0.8493296410244968 + }, + { + "name": "model.layers.20.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.401502901098866e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006774346111342311, + "sensitivity": 0.5717505990487768 + }, + { + "name": "model.layers.20.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.588730320800096e-05, + "sensitivity": 1.1546306379737472 + }, + { + "name": "model.layers.20.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.814826060188352e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.806179590057582e-05, + "sensitivity": 0.9701636485703039 + }, + { + "name": "model.layers.20.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0848245437955484e-05, + "sensitivity": 1.819937022744789 + }, + { + "name": "model.layers.20.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.056972097212565e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.738443724112585e-05, + "sensitivity": 0.6192220301851763 + }, + { + "name": "model.layers.20.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.027605559211224e-05, + "sensitivity": 0.9054179887435536 + }, + { + "name": "model.layers.20.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.192144835244108e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006684227264486253, + "sensitivity": 0.5382310001134892 + }, + { + "name": "model.layers.20.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1007088687620126e-05, + "sensitivity": 1.7554986195726427 + }, + { + "name": "model.layers.20.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.19981392446789e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006586122326552868, + "sensitivity": 0.5944542380048052 + }, + { + "name": "model.layers.20.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0377259968663566e-05, + "sensitivity": 1.2745752563793746 + }, + { + "name": "model.layers.20.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.380104196068714e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006331743206828833, + "sensitivity": 0.5394281888333716 + }, + { + "name": "model.layers.20.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.683744140900671e-05, + "sensitivity": 0.9976576812085537 + }, + { + "name": "model.layers.20.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.427003652082931e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007456554449163377, + "sensitivity": 0.5582909850495396 + }, + { + "name": "model.layers.20.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0279762136633508e-05, + "sensitivity": 1.477514274928815 + }, + { + "name": "model.layers.20.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.367549864691682e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5681255616946146e-05, + "sensitivity": 0.7416347049486325 + }, + { + "name": "model.layers.20.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.66761989123188e-05, + "sensitivity": 0.9848148761165249 + }, + { + "name": "model.layers.20.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.466067017958267e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007716318359598517, + "sensitivity": 0.558240680385377 + }, + { + "name": "model.layers.20.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.949829937890172e-05, + "sensitivity": 0.905795314002399 + }, + { + "name": "model.layers.20.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.631507514815894e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000659218174405396, + "sensitivity": 0.5306706047995501 + }, + { + "name": "model.layers.20.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.127789674792439e-05, + "sensitivity": 1.0301379235554617 + }, + { + "name": "model.layers.20.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.736122592585161e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006708709406666458, + "sensitivity": 0.5484715766211175 + }, + { + "name": "model.layers.20.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.70923909638077e-05, + "sensitivity": 0.9241821580671827 + }, + { + "name": "model.layers.20.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.978014420790714e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.763505371054634e-05, + "sensitivity": 0.8807684402131044 + }, + { + "name": "model.layers.20.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.050448791938834e-05, + "sensitivity": 0.8679977555904304 + }, + { + "name": "model.layers.20.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.544666462104942e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006482892786152661, + "sensitivity": 0.570132743848603 + }, + { + "name": "model.layers.20.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.381754064932466e-05, + "sensitivity": 0.9543989653470197 + }, + { + "name": "model.layers.20.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.033422318476369e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006927655776962638, + "sensitivity": 0.5465341664004278 + }, + { + "name": "model.layers.20.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0581162314338144e-05, + "sensitivity": 1.712146219629282 + }, + { + "name": "model.layers.20.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.420850801689085e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.0253881555399857e-05, + "sensitivity": 1.550776928042143 + }, + { + "name": "model.layers.20.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.031189695931971e-05, + "sensitivity": 0.9216292772220124 + }, + { + "name": "model.layers.20.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.000300570325635e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006763345445506275, + "sensitivity": 0.5475465354076753 + }, + { + "name": "model.layers.20.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.472907261922956e-05, + "sensitivity": 0.8547923224195489 + }, + { + "name": "model.layers.20.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.879174065943516e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006940357270650566, + "sensitivity": 0.5636609558215082 + }, + { + "name": "model.layers.20.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1034686394850723e-05, + "sensitivity": 1.3709432762271838 + }, + { + "name": "model.layers.20.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.199471727086348e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006840967107564211, + "sensitivity": 0.5928577602703559 + }, + { + "name": "model.layers.20.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0009224398527294e-05, + "sensitivity": 0.9343061735791691 + }, + { + "name": "model.layers.20.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.999666197771148e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006848049233667552, + "sensitivity": 0.5339999918743596 + }, + { + "name": "model.layers.20.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0380710591562092e-05, + "sensitivity": 1.3355791098210417 + }, + { + "name": "model.layers.20.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.913892096032214e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.687677185051143e-05, + "sensitivity": 0.8344424737458406 + }, + { + "name": "model.layers.20.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2030905054416507e-05, + "sensitivity": 1.372299701064696 + }, + { + "name": "model.layers.20.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.529755521318293e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007453722646459937, + "sensitivity": 0.542862276386131 + }, + { + "name": "model.layers.20.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.866892752237618e-05, + "sensitivity": 0.7536253260902532 + }, + { + "name": "model.layers.20.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.079810870891379e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006729393498972058, + "sensitivity": 0.5919462851701527 + }, + { + "name": "model.layers.20.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.586630479432642e-05, + "sensitivity": 1.1753121405955858 + }, + { + "name": "model.layers.20.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1028976132365642e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.735823990311474e-05, + "sensitivity": 0.6074948195154166 + }, + { + "name": "model.layers.20.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0839878086699173e-05, + "sensitivity": 1.276936828094001 + }, + { + "name": "model.layers.20.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.775577847089153e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006449393695220351, + "sensitivity": 0.5160687124382078 + }, + { + "name": "model.layers.20.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0283423762302846e-05, + "sensitivity": 1.3334902539381457 + }, + { + "name": "model.layers.20.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.314206863564323e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006283309776335955, + "sensitivity": 0.5997061915728015 + }, + { + "name": "model.layers.20.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.033540557837114e-05, + "sensitivity": 0.7628965819978677 + }, + { + "name": "model.layers.20.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.498334528259875e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006860859575681388, + "sensitivity": 0.5043214022280578 + }, + { + "name": "model.layers.20.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0406653018435463e-05, + "sensitivity": 1.9796778402191213 + }, + { + "name": "model.layers.20.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.502517291868571e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.616348789772019e-05, + "sensitivity": 1.1078518719400512 + }, + { + "name": "model.layers.20.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.542096449877135e-06, + "sensitivity": 1.7564646766345273 + }, + { + "name": "model.layers.20.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.519221986105549e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.0778500735759735e-05, + "sensitivity": 0.9458449278470007 + }, + { + "name": "model.layers.20.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.372154166456312e-05, + "sensitivity": 0.990856333627188 + }, + { + "name": "model.layers.20.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.570590921408439e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.435949762817472e-05, + "sensitivity": 0.734999072091588 + }, + { + "name": "model.layers.20.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.672129918821156e-05, + "sensitivity": 0.9204653334196655 + }, + { + "name": "model.layers.20.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0373216809966834e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006376021774485707, + "sensitivity": 0.5604044189238739 + }, + { + "name": "model.layers.20.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1420552255003713e-05, + "sensitivity": 1.4456218373715932 + }, + { + "name": "model.layers.20.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.444972993653209e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006774680223315954, + "sensitivity": 0.5310657656391488 + }, + { + "name": "model.layers.20.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0526945162564516e-05, + "sensitivity": 1.0166908052597403 + }, + { + "name": "model.layers.20.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.331118692694872e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006412116345018148, + "sensitivity": 0.5425306412546711 + }, + { + "name": "model.layers.20.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 4.22104176323046e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4972766823339043e-06, + "sensitivity": 2.101144466001612 + }, + { + "name": "model.layers.20.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.738845286236028e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.20.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 8.260114555014297e-06, + "sensitivity": 1.7497824349980893 + }, + { + "name": "model.layers.20.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 6.9907564466120675e-06, + "sensitivity": 2.0597086861660436 + }, + { + "name": "model.layers.20.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00020233738177921623, + "sensitivity": 1.0101991886306045 + }, + { + "name": "model.layers.20.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.454328048566822e-05, + "sensitivity": 1.4035260193678885 + }, + { + "name": "model.layers.20.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.8794459619093686e-05, + "sensitivity": 0.6302626247618112 + }, + { + "name": "model.layers.20.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003008406492881477, + "sensitivity": 0.825203343686161 + }, + { + "name": "model.layers.21.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.470707012340426e-05, + "sensitivity": 1.1405754990494357 + }, + { + "name": "model.layers.21.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.869817070764839e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00071334297535941, + "sensitivity": 0.5277189655509682 + }, + { + "name": "model.layers.21.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.145892984932289e-05, + "sensitivity": 0.8981685082232558 + }, + { + "name": "model.layers.21.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.423890338031924e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006810436025261879, + "sensitivity": 0.5441798069500908 + }, + { + "name": "model.layers.21.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9178313676966354e-05, + "sensitivity": 0.6322503508803525 + }, + { + "name": "model.layers.21.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.45981276142993e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006666152039542794, + "sensitivity": 0.49616880216085524 + }, + { + "name": "model.layers.21.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4089061450213194e-05, + "sensitivity": 0.9503398868682165 + }, + { + "name": "model.layers.21.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.417047870854731e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005756285972893238, + "sensitivity": 0.5662198854708143 + }, + { + "name": "model.layers.21.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9239595429971814e-05, + "sensitivity": 1.181638438713063 + }, + { + "name": "model.layers.21.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.037862701508857e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006333107594400644, + "sensitivity": 0.5527928063399578 + }, + { + "name": "model.layers.21.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.065780088538304e-05, + "sensitivity": 1.5724684563124416 + }, + { + "name": "model.layers.21.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.729625164960453e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006192586151883006, + "sensitivity": 0.5613491564568702 + }, + { + "name": "model.layers.21.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.557505210163072e-05, + "sensitivity": 0.8746739087617841 + }, + { + "name": "model.layers.21.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.352805593858648e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005968051846139133, + "sensitivity": 0.5469736692587901 + }, + { + "name": "model.layers.21.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.704361294396222e-05, + "sensitivity": 1.0234870286173972 + }, + { + "name": "model.layers.21.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.47854187466146e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.475860573118553e-05, + "sensitivity": 1.0945644950246605 + }, + { + "name": "model.layers.21.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8123514463659376e-05, + "sensitivity": 0.8187532116792057 + }, + { + "name": "model.layers.21.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.156410219977261e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006469328654929996, + "sensitivity": 0.5270182753440417 + }, + { + "name": "model.layers.21.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0189176464336924e-05, + "sensitivity": 1.2672851248044037 + }, + { + "name": "model.layers.21.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.372174539137632e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006151500856503844, + "sensitivity": 0.5363336815226907 + }, + { + "name": "model.layers.21.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.137401214800775e-05, + "sensitivity": 0.9766061153983782 + }, + { + "name": "model.layers.21.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.607788686276763e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000670911162160337, + "sensitivity": 0.5338839562401135 + }, + { + "name": "model.layers.21.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.860920646227896e-05, + "sensitivity": 0.9593149572590405 + }, + { + "name": "model.layers.21.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.483195420514676e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006587253883481026, + "sensitivity": 0.5734096887531699 + }, + { + "name": "model.layers.21.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.882800542167388e-05, + "sensitivity": 0.6482169617977906 + }, + { + "name": "model.layers.21.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.061071750693372e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000619435915723443, + "sensitivity": 0.5225868773872941 + }, + { + "name": "model.layers.21.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.589374268311076e-05, + "sensitivity": 1.131786674100676 + }, + { + "name": "model.layers.21.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.98837697604904e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.0364199624746107e-05, + "sensitivity": 1.2095712247361128 + }, + { + "name": "model.layers.21.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.336133810691535e-05, + "sensitivity": 0.6485839395462321 + }, + { + "name": "model.layers.21.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.850230758776888e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006753271445631981, + "sensitivity": 0.5265299552694438 + }, + { + "name": "model.layers.21.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.934457294642925e-05, + "sensitivity": 0.8426853116919891 + }, + { + "name": "model.layers.21.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.76200386351411e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006494239205494523, + "sensitivity": 0.5330858177802806 + }, + { + "name": "model.layers.21.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0701416613301262e-05, + "sensitivity": 1.2495467924527464 + }, + { + "name": "model.layers.21.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.606962182966527e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006318545201793313, + "sensitivity": 0.5876133186381026 + }, + { + "name": "model.layers.21.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.879285163246095e-05, + "sensitivity": 0.8070965065733529 + }, + { + "name": "model.layers.21.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.428587878166582e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006257513887248933, + "sensitivity": 0.5357910339842388 + }, + { + "name": "model.layers.21.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0835396096808836e-05, + "sensitivity": 1.3922430188789718 + }, + { + "name": "model.layers.21.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.326366701614461e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000656719203107059, + "sensitivity": 0.5182769977667021 + }, + { + "name": "model.layers.21.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0884653066750616e-05, + "sensitivity": 0.8130134376217784 + }, + { + "name": "model.layers.21.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.99333554621262e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006487469072453678, + "sensitivity": 0.5774438552440821 + }, + { + "name": "model.layers.21.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.793773743789643e-05, + "sensitivity": 0.8275856461126941 + }, + { + "name": "model.layers.21.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.71174370584049e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000605597160756588, + "sensitivity": 0.5187332723226392 + }, + { + "name": "model.layers.21.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.370445771608502e-05, + "sensitivity": 0.6237224031778393 + }, + { + "name": "model.layers.21.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.00828126759734e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006917849532328546, + "sensitivity": 0.5523803057096908 + }, + { + "name": "model.layers.21.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0309324352419935e-05, + "sensitivity": 1.4048941215489588 + }, + { + "name": "model.layers.21.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.575747650254925e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006085638306103647, + "sensitivity": 0.5159564884975094 + }, + { + "name": "model.layers.21.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6270808272529393e-05, + "sensitivity": 0.8629456893193356 + }, + { + "name": "model.layers.21.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.869498747619218e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006053994875401258, + "sensitivity": 0.5243826231545688 + }, + { + "name": "model.layers.21.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7954381190938875e-05, + "sensitivity": 1.1802838393255397 + }, + { + "name": "model.layers.21.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.645947792094375e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006071124807931483, + "sensitivity": 0.4954425177365363 + }, + { + "name": "model.layers.21.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.430847871437436e-06, + "sensitivity": 2.0968226202249425 + }, + { + "name": "model.layers.21.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.344195639940153e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000664765015244484, + "sensitivity": 0.5337841621169286 + }, + { + "name": "model.layers.21.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1897648619196843e-05, + "sensitivity": 1.301363233344454 + }, + { + "name": "model.layers.21.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.632056847091008e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.358055543387309e-05, + "sensitivity": 0.8693081580805506 + }, + { + "name": "model.layers.21.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.635792669840157e-05, + "sensitivity": 0.6569584651703313 + }, + { + "name": "model.layers.21.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.294833039850346e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007257845136336982, + "sensitivity": 0.5357987850484229 + }, + { + "name": "model.layers.21.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.584775863098912e-05, + "sensitivity": 0.6107468723755627 + }, + { + "name": "model.layers.21.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.127850156190107e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006040145526640117, + "sensitivity": 0.5161898611115291 + }, + { + "name": "model.layers.21.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.553993443958461e-05, + "sensitivity": 0.6397581027143381 + }, + { + "name": "model.layers.21.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.74033389663964e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007216609083116055, + "sensitivity": 0.5211462688160122 + }, + { + "name": "model.layers.21.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.358297832775861e-05, + "sensitivity": 0.8215587668279092 + }, + { + "name": "model.layers.21.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.375008752002032e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.261604721657932e-05, + "sensitivity": 0.7148120926793915 + }, + { + "name": "model.layers.21.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.95935741532594e-05, + "sensitivity": 1.1524595037576861 + }, + { + "name": "model.layers.21.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.17182274456718e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007819534512236714, + "sensitivity": 0.5423164583934699 + }, + { + "name": "model.layers.21.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.883823541807942e-05, + "sensitivity": 0.6803150515668173 + }, + { + "name": "model.layers.21.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.72085582462023e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00063799147028476, + "sensitivity": 0.551994440533667 + }, + { + "name": "model.layers.21.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.195553634010139e-06, + "sensitivity": 2.0970824769479073 + }, + { + "name": "model.layers.21.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.672940233125701e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000590536103118211, + "sensitivity": 0.5198198146986255 + }, + { + "name": "model.layers.21.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.757307371823117e-05, + "sensitivity": 0.6360062981662613 + }, + { + "name": "model.layers.21.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1571207778615644e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006157857715152204, + "sensitivity": 0.5643761312959038 + }, + { + "name": "model.layers.21.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1914049537153915e-05, + "sensitivity": 1.6130534958913352 + }, + { + "name": "model.layers.21.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.289471568583394e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007349028019234538, + "sensitivity": 0.5355710078574176 + }, + { + "name": "model.layers.21.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.183538062032312e-05, + "sensitivity": 0.9234467734891907 + }, + { + "name": "model.layers.21.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.584716286146431e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006960986065678298, + "sensitivity": 0.5607702890469304 + }, + { + "name": "model.layers.21.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.890133616048843e-05, + "sensitivity": 0.8866689404702304 + }, + { + "name": "model.layers.21.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.730891411483753e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.465430149342865e-05, + "sensitivity": 0.6053900239414027 + }, + { + "name": "model.layers.21.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.849348963238299e-05, + "sensitivity": 0.6857072491240499 + }, + { + "name": "model.layers.21.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.906662181587308e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006367613095790148, + "sensitivity": 0.5140802155664165 + }, + { + "name": "model.layers.21.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.599655898753554e-05, + "sensitivity": 1.0034940597911512 + }, + { + "name": "model.layers.21.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.146254918348859e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.420408317353576e-05, + "sensitivity": 0.6600740954700368 + }, + { + "name": "model.layers.21.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6511118600610644e-05, + "sensitivity": 0.7222658021020516 + }, + { + "name": "model.layers.21.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.970707767730346e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5994569265749305e-05, + "sensitivity": 0.63260745308644 + }, + { + "name": "model.layers.21.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.826041888212785e-05, + "sensitivity": 0.9672263150114004 + }, + { + "name": "model.layers.21.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.385035243918537e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5761804105713964e-05, + "sensitivity": 0.6158916572846231 + }, + { + "name": "model.layers.21.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.10812712693587e-05, + "sensitivity": 1.0026139040159063 + }, + { + "name": "model.layers.21.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.617235612793593e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006627800757996738, + "sensitivity": 0.5406390792211939 + }, + { + "name": "model.layers.21.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000641274731606245, + "sensitivity": 0.5634387430241662 + }, + { + "name": "model.layers.21.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.933584586477082e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006220659706741571, + "sensitivity": 0.5250074927021652 + }, + { + "name": "model.layers.21.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6636483350303024e-05, + "sensitivity": 1.1109737555801247 + }, + { + "name": "model.layers.21.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.678537036146736e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006289500743150711, + "sensitivity": 0.531988322664145 + }, + { + "name": "model.layers.21.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9459525800775737e-05, + "sensitivity": 0.9117354680240873 + }, + { + "name": "model.layers.21.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.135742521313659e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006434587412513793, + "sensitivity": 0.549942426721354 + }, + { + "name": "model.layers.21.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8652683947002515e-05, + "sensitivity": 0.7680744627554967 + }, + { + "name": "model.layers.21.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.538255886174738e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.565858737099916e-05, + "sensitivity": 0.6276297241848575 + }, + { + "name": "model.layers.21.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9434572904137895e-05, + "sensitivity": 0.9284828392958464 + }, + { + "name": "model.layers.21.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.5544147648543e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006237897323444486, + "sensitivity": 0.5534648183721057 + }, + { + "name": "model.layers.21.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.54807809041813e-05, + "sensitivity": 0.8250748164600921 + }, + { + "name": "model.layers.21.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.711947773714201e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000730929896235466, + "sensitivity": 0.5464915360339504 + }, + { + "name": "model.layers.21.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0739082426880486e-05, + "sensitivity": 1.3276580275218854 + }, + { + "name": "model.layers.21.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.444740385333716e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.736047387472354e-05, + "sensitivity": 0.685787969705762 + }, + { + "name": "model.layers.21.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.489269096869975e-05, + "sensitivity": 0.6931987539767394 + }, + { + "name": "model.layers.21.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.986200903862482e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006049717194400728, + "sensitivity": 0.5132135174887917 + }, + { + "name": "model.layers.21.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.159242184367031e-05, + "sensitivity": 0.6712487122626843 + }, + { + "name": "model.layers.21.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.734593054919969e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9704754676204175e-05, + "sensitivity": 0.623061109610997 + }, + { + "name": "model.layers.21.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9615791542455554e-05, + "sensitivity": 0.7275653637179735 + }, + { + "name": "model.layers.21.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.111860895747668e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006256886990740895, + "sensitivity": 0.5256866760678321 + }, + { + "name": "model.layers.21.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.596443224931136e-05, + "sensitivity": 1.0126009794573219 + }, + { + "name": "model.layers.21.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.282928891072515e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006127101369202137, + "sensitivity": 0.5982327648013748 + }, + { + "name": "model.layers.21.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.682985364634078e-06, + "sensitivity": 1.2538070564459824 + }, + { + "name": "model.layers.21.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0650073818396777e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.24188217241317e-05, + "sensitivity": 0.6272980026541357 + }, + { + "name": "model.layers.21.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.700580368284136e-05, + "sensitivity": 0.8955829602496694 + }, + { + "name": "model.layers.21.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.966756700421683e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006296024657785892, + "sensitivity": 0.5352157491990078 + }, + { + "name": "model.layers.21.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.539047727623256e-06, + "sensitivity": 2.097609276374532 + }, + { + "name": "model.layers.21.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3108351595292334e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.636913556372747e-05, + "sensitivity": 0.9781671104935199 + }, + { + "name": "model.layers.21.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.356221274472773e-05, + "sensitivity": 0.8491077840274295 + }, + { + "name": "model.layers.21.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.405703286167409e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006949134403839707, + "sensitivity": 0.52600187844559 + }, + { + "name": "model.layers.21.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.846908243256621e-05, + "sensitivity": 1.1402759260158555 + }, + { + "name": "model.layers.21.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.328581202476926e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.680865069734864e-05, + "sensitivity": 0.6586736467989712 + }, + { + "name": "model.layers.21.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.472470002132468e-05, + "sensitivity": 0.8804270933809185 + }, + { + "name": "model.layers.21.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.694417038488609e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005938475951552391, + "sensitivity": 0.5416502566170365 + }, + { + "name": "model.layers.21.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.998781933973078e-06, + "sensitivity": 1.3403120055299953 + }, + { + "name": "model.layers.21.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.916719712535269e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 9.702158422442153e-06, + "sensitivity": 1.3978888198182515 + }, + { + "name": "model.layers.21.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1622492820606567e-05, + "sensitivity": 1.2578874620116256 + }, + { + "name": "model.layers.21.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.004314733829233e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007119872607290745, + "sensitivity": 0.5313371725952815 + }, + { + "name": "model.layers.21.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.0241859601810575e-06, + "sensitivity": 2.0972836723120185 + }, + { + "name": "model.layers.21.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.896821224065206e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 4.7952751629054546e-05, + "sensitivity": 0.8504883641154154 + }, + { + "name": "model.layers.21.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.582808418897912e-05, + "sensitivity": 0.8569958708927742 + }, + { + "name": "model.layers.21.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.205947210626618e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007280017016455531, + "sensitivity": 0.5364832208362303 + }, + { + "name": "model.layers.21.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 3.782971816690406e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4380983631999698e-06, + "sensitivity": 2.1007758199750826 + }, + { + "name": "model.layers.21.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.585783237118449e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.21.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.964564489753684e-06, + "sensitivity": 2.1039044575160832 + }, + { + "name": "model.layers.21.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 8.39658150653122e-06, + "sensitivity": 2.11276756029186 + }, + { + "name": "model.layers.21.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00019187886209692806, + "sensitivity": 0.8865392553408962 + }, + { + "name": "model.layers.21.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.7045678760041483e-05, + "sensitivity": 1.3427902773651461 + }, + { + "name": "model.layers.21.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 5, + "mse": 3.0231710752559593e-06, + "sensitivity": 2.0203870733171136 + }, + { + "name": "model.layers.21.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002694542345125228, + "sensitivity": 0.6575331437532186 + }, + { + "name": "model.layers.22.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.56667907605879e-05, + "sensitivity": 0.8483390800657236 + }, + { + "name": "model.layers.22.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0087665032187942e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007416922599077225, + "sensitivity": 0.5616760605953999 + }, + { + "name": "model.layers.22.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.572026904905215e-05, + "sensitivity": 1.0888276061983084 + }, + { + "name": "model.layers.22.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.836781262289151e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.316692451946437e-05, + "sensitivity": 0.665804004245721 + }, + { + "name": "model.layers.22.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.71158598177135e-05, + "sensitivity": 1.113347077749221 + }, + { + "name": "model.layers.22.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.745454245698056e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006312463083304465, + "sensitivity": 0.5453714096967 + }, + { + "name": "model.layers.22.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0667284186638426e-05, + "sensitivity": 1.5706242917853293 + }, + { + "name": "model.layers.22.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.555057320336346e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006635886966250837, + "sensitivity": 0.5468768801696748 + }, + { + "name": "model.layers.22.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7087581808445975e-05, + "sensitivity": 1.1282998578813328 + }, + { + "name": "model.layers.22.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.536180651688483e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.482445703819394e-05, + "sensitivity": 0.6866101348857243 + }, + { + "name": "model.layers.22.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.6337900180806173e-06, + "sensitivity": 2.0973933110073917 + }, + { + "name": "model.layers.22.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.964116548464517e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007536776829510927, + "sensitivity": 0.550156683104402 + }, + { + "name": "model.layers.22.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.105373667087406e-05, + "sensitivity": 1.5163363240948067 + }, + { + "name": "model.layers.22.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.457571769009519e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006607574177905917, + "sensitivity": 0.5957658441687577 + }, + { + "name": "model.layers.22.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.241083610802889e-05, + "sensitivity": 0.9678169495017461 + }, + { + "name": "model.layers.22.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.626940146110428e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.452956586144865e-05, + "sensitivity": 0.609754298182538 + }, + { + "name": "model.layers.22.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.711079575121403e-05, + "sensitivity": 0.9335853188160506 + }, + { + "name": "model.layers.22.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.272758241721021e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006226321565918624, + "sensitivity": 0.55496667450775 + }, + { + "name": "model.layers.22.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.71858327020891e-05, + "sensitivity": 0.6584179212456969 + }, + { + "name": "model.layers.22.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.20395894657122e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006378985708579421, + "sensitivity": 0.5036602016905956 + }, + { + "name": "model.layers.22.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0642343113431707e-05, + "sensitivity": 1.3255387571925519 + }, + { + "name": "model.layers.22.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.008833217194478e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006411510985344648, + "sensitivity": 0.554858466198227 + }, + { + "name": "model.layers.22.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.154163565952331e-05, + "sensitivity": 1.0489646133021868 + }, + { + "name": "model.layers.22.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.735507321944169e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000679934280924499, + "sensitivity": 0.5476577570906018 + }, + { + "name": "model.layers.22.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6347060308326036e-05, + "sensitivity": 0.9368099713264783 + }, + { + "name": "model.layers.22.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.808370577957248e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.551743015530519e-05, + "sensitivity": 0.6783149444246934 + }, + { + "name": "model.layers.22.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.870162203791551e-05, + "sensitivity": 1.1278496277974495 + }, + { + "name": "model.layers.22.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.443484489362163e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7908411690732464e-05, + "sensitivity": 0.7506539027482667 + }, + { + "name": "model.layers.22.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.07698893873021e-05, + "sensitivity": 0.8698657314504603 + }, + { + "name": "model.layers.22.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.645922780990077e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006563437054865062, + "sensitivity": 0.509784640877408 + }, + { + "name": "model.layers.22.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.620387310045771e-05, + "sensitivity": 0.9380033253939282 + }, + { + "name": "model.layers.22.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1663373697956558e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006272218888625503, + "sensitivity": 0.5863626444774883 + }, + { + "name": "model.layers.22.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0950212526950054e-05, + "sensitivity": 1.458229272982133 + }, + { + "name": "model.layers.22.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.772687584088999e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.981250433251262e-05, + "sensitivity": 0.6230769116990666 + }, + { + "name": "model.layers.22.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0223220670013689e-05, + "sensitivity": 1.8400098608640456 + }, + { + "name": "model.layers.22.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.79899960939656e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5586187954759225e-05, + "sensitivity": 0.6163777853223603 + }, + { + "name": "model.layers.22.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0049890988739207e-05, + "sensitivity": 1.382525075042724 + }, + { + "name": "model.layers.22.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.531098281608138e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006045112386345863, + "sensitivity": 0.5260918517310695 + }, + { + "name": "model.layers.22.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1164775060024112e-05, + "sensitivity": 1.2392061189690793 + }, + { + "name": "model.layers.22.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.935045687190723e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006962585030123591, + "sensitivity": 0.5530764193845195 + }, + { + "name": "model.layers.22.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2094356861780398e-05, + "sensitivity": 1.9631615373680722 + }, + { + "name": "model.layers.22.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.548454732386745e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007478423649445176, + "sensitivity": 0.5237141572394394 + }, + { + "name": "model.layers.22.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.992728256387636e-05, + "sensitivity": 0.64283938750788 + }, + { + "name": "model.layers.22.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.177745603963558e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006630040588788688, + "sensitivity": 0.541999497275556 + }, + { + "name": "model.layers.22.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.938087633694522e-05, + "sensitivity": 0.7892617575982078 + }, + { + "name": "model.layers.22.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.214918582576502e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006710853194817901, + "sensitivity": 0.5315456830090102 + }, + { + "name": "model.layers.22.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7212873798562214e-05, + "sensitivity": 0.8748850829641914 + }, + { + "name": "model.layers.22.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.666423809700063e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006374261574819684, + "sensitivity": 0.5744315837111832 + }, + { + "name": "model.layers.22.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8358309615869075e-05, + "sensitivity": 0.7731973314491084 + }, + { + "name": "model.layers.22.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.203564453244326e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006438556592911482, + "sensitivity": 0.5181801839774159 + }, + { + "name": "model.layers.22.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9135545598110184e-05, + "sensitivity": 0.8112252112411666 + }, + { + "name": "model.layers.22.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.650039037798706e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006629450945183635, + "sensitivity": 0.5291117855717549 + }, + { + "name": "model.layers.22.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0757581549114548e-05, + "sensitivity": 1.2176652244739676 + }, + { + "name": "model.layers.22.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.601946319686249e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006560278125107288, + "sensitivity": 0.5503460601608802 + }, + { + "name": "model.layers.22.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.809578578919172e-05, + "sensitivity": 0.8802972772187485 + }, + { + "name": "model.layers.22.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.908569503139006e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006448211497627199, + "sensitivity": 0.5938683379514424 + }, + { + "name": "model.layers.22.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.322897388599813e-05, + "sensitivity": 0.8824782892315874 + }, + { + "name": "model.layers.22.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.158184303079906e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007096983026713133, + "sensitivity": 0.5131836444099749 + }, + { + "name": "model.layers.22.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.736937600886449e-05, + "sensitivity": 0.8296182816841178 + }, + { + "name": "model.layers.22.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.96952759224223e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000636305776424706, + "sensitivity": 0.5500020689377991 + }, + { + "name": "model.layers.22.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0170171663048677e-05, + "sensitivity": 1.4267925585460308 + }, + { + "name": "model.layers.22.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.71945918181882e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006069838418625295, + "sensitivity": 0.5343719803430172 + }, + { + "name": "model.layers.22.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.199610652402043e-05, + "sensitivity": 0.8666228868541752 + }, + { + "name": "model.layers.22.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.611628234371892e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.004492752254009e-05, + "sensitivity": 0.7627208579755788 + }, + { + "name": "model.layers.22.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.651542207691818e-05, + "sensitivity": 0.8795493610655879 + }, + { + "name": "model.layers.22.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.479551413780428e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.834907981101424e-05, + "sensitivity": 0.6009680495769741 + }, + { + "name": "model.layers.22.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0361793101765215e-05, + "sensitivity": 1.2828177540429133 + }, + { + "name": "model.layers.22.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.962024710650439e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.705348667106591e-05, + "sensitivity": 0.7234874118371908 + }, + { + "name": "model.layers.22.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9844765928573906e-05, + "sensitivity": 1.127527965254845 + }, + { + "name": "model.layers.22.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.451617645732767e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006729811429977417, + "sensitivity": 0.5333905595507623 + }, + { + "name": "model.layers.22.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.822765524499118e-05, + "sensitivity": 0.9899675928909057 + }, + { + "name": "model.layers.22.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.752810458645399e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.816500197397545e-05, + "sensitivity": 0.6585783460990875 + }, + { + "name": "model.layers.22.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.903498822590336e-05, + "sensitivity": 0.816956627817945 + }, + { + "name": "model.layers.22.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.880795121513074e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006612031138502061, + "sensitivity": 0.5298085308966607 + }, + { + "name": "model.layers.22.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.589172360487282e-05, + "sensitivity": 0.946710767029887 + }, + { + "name": "model.layers.22.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.524612210043415e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006221960647962987, + "sensitivity": 0.5574631066020017 + }, + { + "name": "model.layers.22.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.457543349824846e-05, + "sensitivity": 1.1364033967809295 + }, + { + "name": "model.layers.22.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.841090786721907e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007323867175728083, + "sensitivity": 0.5844849447142206 + }, + { + "name": "model.layers.22.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.486240115715191e-05, + "sensitivity": 1.0593538666636677 + }, + { + "name": "model.layers.22.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.616864200419514e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006013004458509386, + "sensitivity": 0.5385024622551718 + }, + { + "name": "model.layers.22.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0558382200542837e-05, + "sensitivity": 1.7843935135047038 + }, + { + "name": "model.layers.22.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.327364184879116e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.594580579781905e-05, + "sensitivity": 0.6761231227382877 + }, + { + "name": "model.layers.22.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.824711115565151e-05, + "sensitivity": 0.9158564102944027 + }, + { + "name": "model.layers.22.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.272023706012988e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006438942509703338, + "sensitivity": 0.563524588999176 + }, + { + "name": "model.layers.22.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0486375686014071e-05, + "sensitivity": 1.253854202281932 + }, + { + "name": "model.layers.22.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.887993097530853e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006188774714246392, + "sensitivity": 0.5775393408245677 + }, + { + "name": "model.layers.22.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.140892618423095e-05, + "sensitivity": 1.4771172986162353 + }, + { + "name": "model.layers.22.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.235104817482352e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.844766565132886e-05, + "sensitivity": 0.6902943360675445 + }, + { + "name": "model.layers.22.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1369505045877304e-05, + "sensitivity": 1.223487706050514 + }, + { + "name": "model.layers.22.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.682168418592482e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000683480582665652, + "sensitivity": 0.5142055952849968 + }, + { + "name": "model.layers.22.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1346650353516452e-05, + "sensitivity": 1.2080392934177522 + }, + { + "name": "model.layers.22.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.482274557129131e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006929466035217047, + "sensitivity": 0.5384676250720434 + }, + { + "name": "model.layers.22.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0431626479839906e-05, + "sensitivity": 0.7961475076026204 + }, + { + "name": "model.layers.22.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.048578254398308e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.1097439710283652e-05, + "sensitivity": 1.2150817957415367 + }, + { + "name": "model.layers.22.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0472302720882e-05, + "sensitivity": 0.7868762509615068 + }, + { + "name": "model.layers.22.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2184758588773548e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006675118347629905, + "sensitivity": 0.5550824361880548 + }, + { + "name": "model.layers.22.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.974400482955389e-05, + "sensitivity": 0.8872055494691227 + }, + { + "name": "model.layers.22.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.016169891154277e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8037428971147165e-05, + "sensitivity": 0.6159250152935878 + }, + { + "name": "model.layers.22.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0642168490448967e-05, + "sensitivity": 1.7828401202531037 + }, + { + "name": "model.layers.22.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0724006642703898e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.63515568501316e-05, + "sensitivity": 0.8935013505815995 + }, + { + "name": "model.layers.22.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.656555342487991e-05, + "sensitivity": 1.0456408203187184 + }, + { + "name": "model.layers.22.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.021084585772769e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00078695232514292, + "sensitivity": 0.5863430661568206 + }, + { + "name": "model.layers.22.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.89020928600803e-05, + "sensitivity": 0.9534578861171656 + }, + { + "name": "model.layers.22.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.9791244666485e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006519048474729061, + "sensitivity": 0.5839464336355608 + }, + { + "name": "model.layers.22.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0605544048303273e-05, + "sensitivity": 1.4958930512609527 + }, + { + "name": "model.layers.22.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.618017434651847e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7752062275540084e-05, + "sensitivity": 0.6939942943588301 + }, + { + "name": "model.layers.22.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1237374565098435e-05, + "sensitivity": 1.314535137599238 + }, + { + "name": "model.layers.22.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.37388211544021e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000686120125465095, + "sensitivity": 0.5338432669317794 + }, + { + "name": "model.layers.22.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.153186404844746e-05, + "sensitivity": 0.8200776520695697 + }, + { + "name": "model.layers.22.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.728510240667674e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006930383387953043, + "sensitivity": 0.5129730418476924 + }, + { + "name": "model.layers.22.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.799957943963818e-05, + "sensitivity": 0.9908800571694502 + }, + { + "name": "model.layers.22.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.267640509984631e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006350053008645773, + "sensitivity": 0.5164301875345324 + }, + { + "name": "model.layers.22.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.082585185940843e-05, + "sensitivity": 1.6754269175694971 + }, + { + "name": "model.layers.22.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.013651952547661e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.892355693504214e-05, + "sensitivity": 0.7312412486972154 + }, + { + "name": "model.layers.22.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.56390659767203e-05, + "sensitivity": 0.8863351862902266 + }, + { + "name": "model.layers.22.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.589617444456962e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006184853264130652, + "sensitivity": 0.5051559251716705 + }, + { + "name": "model.layers.22.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.885845429380424e-06, + "sensitivity": 1.5075894270006305 + }, + { + "name": "model.layers.22.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.500391466739529e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005972343496978283, + "sensitivity": 0.537126667807763 + }, + { + "name": "model.layers.22.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.338371192920022e-05, + "sensitivity": 0.9436815487719153 + }, + { + "name": "model.layers.22.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.395060043156263e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.1940802222816274e-05, + "sensitivity": 0.708979275086528 + }, + { + "name": "model.layers.22.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.732461042702198e-05, + "sensitivity": 0.8955151414200511 + }, + { + "name": "model.layers.22.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.632192359276814e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.989724352024496e-05, + "sensitivity": 0.8226693272360504 + }, + { + "name": "model.layers.22.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0563817340880632e-05, + "sensitivity": 1.7494980889471252 + }, + { + "name": "model.layers.22.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.028306410778896e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7864577684085816e-05, + "sensitivity": 1.1591246934646517 + }, + { + "name": "model.layers.22.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8767891459865496e-05, + "sensitivity": 1.0017397619736792 + }, + { + "name": "model.layers.22.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.561466190963984e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000665161176584661, + "sensitivity": 0.5302874364624178 + }, + { + "name": "model.layers.22.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0696282162098214e-05, + "sensitivity": 0.6513029535247876 + }, + { + "name": "model.layers.22.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.735765166216879e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006683942629024386, + "sensitivity": 0.5555399238038377 + }, + { + "name": "model.layers.22.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 3.8034768294892274e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.46106242229871e-06, + "sensitivity": 2.0996964644812257 + }, + { + "name": "model.layers.22.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.044948577255127e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.22.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 8.600967703387141e-06, + "sensitivity": 1.6482784280074676 + }, + { + "name": "model.layers.22.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 2.7693076845025644e-05, + "sensitivity": 1.6086821538531093 + }, + { + "name": "model.layers.22.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.0001773597177816555, + "sensitivity": 0.9708254655408286 + }, + { + "name": "model.layers.22.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.5107136277947575e-05, + "sensitivity": 1.3416098007019635 + }, + { + "name": "model.layers.22.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.886990038561635e-05, + "sensitivity": 0.7131944384569984 + }, + { + "name": "model.layers.22.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002624464686959982, + "sensitivity": 0.7164823237599173 + }, + { + "name": "model.layers.23.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0344770089432131e-05, + "sensitivity": 1.5194623680602186 + }, + { + "name": "model.layers.23.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.972101687097165e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6620057875989005e-05, + "sensitivity": 0.8099467798314249 + }, + { + "name": "model.layers.23.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.798436905024573e-05, + "sensitivity": 1.1802072109247421 + }, + { + "name": "model.layers.23.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.053737019508844e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006465916521847248, + "sensitivity": 0.5407696985671706 + }, + { + "name": "model.layers.23.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9053149016108364e-05, + "sensitivity": 0.7798696515253496 + }, + { + "name": "model.layers.23.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1584390904317843e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.893657362321392e-05, + "sensitivity": 0.7025216735954837 + }, + { + "name": "model.layers.23.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.968369805486873e-05, + "sensitivity": 0.6331506381337162 + }, + { + "name": "model.layers.23.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.475256325051305e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.967367178527638e-05, + "sensitivity": 0.6149050173845396 + }, + { + "name": "model.layers.23.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.839138611918315e-05, + "sensitivity": 0.7234902885809288 + }, + { + "name": "model.layers.23.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.423817234870512e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000662479258608073, + "sensitivity": 0.5315885651419796 + }, + { + "name": "model.layers.23.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006731246830895543, + "sensitivity": 0.5829385991034397 + }, + { + "name": "model.layers.23.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.101388632690941e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006843781447969377, + "sensitivity": 0.5459808695991265 + }, + { + "name": "model.layers.23.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.465174374170601e-05, + "sensitivity": 0.9254648759080065 + }, + { + "name": "model.layers.23.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.437041631419561e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007354131666943431, + "sensitivity": 0.5204560499137848 + }, + { + "name": "model.layers.23.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8443845773581415e-05, + "sensitivity": 0.6900153898584416 + }, + { + "name": "model.layers.23.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.149862770143955e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000630149501375854, + "sensitivity": 0.5449572336200611 + }, + { + "name": "model.layers.23.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.855241761310026e-05, + "sensitivity": 0.9740901538351319 + }, + { + "name": "model.layers.23.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.223286502267001e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8324098063167185e-05, + "sensitivity": 0.6907986423650871 + }, + { + "name": "model.layers.23.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007308712229132652, + "sensitivity": 0.5850234997915367 + }, + { + "name": "model.layers.23.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.369010740556405e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007723450544290245, + "sensitivity": 0.5584750705410588 + }, + { + "name": "model.layers.23.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.163332727737725e-05, + "sensitivity": 0.8090881845454014 + }, + { + "name": "model.layers.23.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.593532013241202e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.331225449685007e-05, + "sensitivity": 0.7615802767329417 + }, + { + "name": "model.layers.23.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.735422018915415e-05, + "sensitivity": 1.0389225779963935 + }, + { + "name": "model.layers.23.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.076163572288351e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006445469916798174, + "sensitivity": 0.547177579177943 + }, + { + "name": "model.layers.23.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7498102250974625e-05, + "sensitivity": 0.7202523338434988 + }, + { + "name": "model.layers.23.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.572108190994186e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006437463453039527, + "sensitivity": 0.5747571934558269 + }, + { + "name": "model.layers.23.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1325179002596997e-05, + "sensitivity": 1.987920095991545 + }, + { + "name": "model.layers.23.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.974173286129371e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.054944242350757e-05, + "sensitivity": 0.6512364315351131 + }, + { + "name": "model.layers.23.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.734761361964047e-05, + "sensitivity": 1.0387054651898644 + }, + { + "name": "model.layers.23.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.376187116075016e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006259295041672885, + "sensitivity": 0.5252295845267203 + }, + { + "name": "model.layers.23.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.389809277607128e-05, + "sensitivity": 0.6399782859720696 + }, + { + "name": "model.layers.23.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.727535825732048e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.403546285582706e-05, + "sensitivity": 0.7493024997693607 + }, + { + "name": "model.layers.23.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6457327445968986e-05, + "sensitivity": 0.6122299494613926 + }, + { + "name": "model.layers.23.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0396089464848046e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006270084413699806, + "sensitivity": 0.5282887593032334 + }, + { + "name": "model.layers.23.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.947591125732288e-05, + "sensitivity": 0.9327136112730321 + }, + { + "name": "model.layers.23.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.625344894928276e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006714216433465481, + "sensitivity": 0.5854103474839663 + }, + { + "name": "model.layers.23.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.689120345981792e-05, + "sensitivity": 0.8182049723496883 + }, + { + "name": "model.layers.23.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.007185445218056e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007574408082291484, + "sensitivity": 0.5866569752687196 + }, + { + "name": "model.layers.23.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1368038940418046e-05, + "sensitivity": 1.5985122811774852 + }, + { + "name": "model.layers.23.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.825770123621623e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.071916868677363e-05, + "sensitivity": 0.7154548556375024 + }, + { + "name": "model.layers.23.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.845763371326029e-05, + "sensitivity": 0.6326880284135424 + }, + { + "name": "model.layers.23.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.976515234986437e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7839024520944804e-05, + "sensitivity": 0.9150978326954551 + }, + { + "name": "model.layers.23.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006567409145645797, + "sensitivity": 0.5703766354537058 + }, + { + "name": "model.layers.23.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.988771244527015e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006348647875711322, + "sensitivity": 0.5657077060360924 + }, + { + "name": "model.layers.23.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0848302382510155e-05, + "sensitivity": 0.7985769552937871 + }, + { + "name": "model.layers.23.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.878710223645612e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006547847297042608, + "sensitivity": 0.5406073092503514 + }, + { + "name": "model.layers.23.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0666908565326594e-05, + "sensitivity": 1.7568588880858418 + }, + { + "name": "model.layers.23.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.991151053625799e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006521636387333274, + "sensitivity": 0.545379176901954 + }, + { + "name": "model.layers.23.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9881331253563985e-05, + "sensitivity": 1.0899271601975011 + }, + { + "name": "model.layers.23.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.40544123800646e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006692990427836776, + "sensitivity": 0.5494588937905218 + }, + { + "name": "model.layers.23.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.879232776351273e-05, + "sensitivity": 0.8106012695415316 + }, + { + "name": "model.layers.23.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.295632033470611e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006546465447172523, + "sensitivity": 0.5308143932456463 + }, + { + "name": "model.layers.23.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7730834669200704e-05, + "sensitivity": 0.8455102166877334 + }, + { + "name": "model.layers.23.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.560132300772239e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.407911885413341e-05, + "sensitivity": 0.6459628123871882 + }, + { + "name": "model.layers.23.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.408502667909488e-05, + "sensitivity": 0.7391221263922982 + }, + { + "name": "model.layers.23.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.891662789916154e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.435107934521511e-05, + "sensitivity": 0.7727401931709401 + }, + { + "name": "model.layers.23.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1191611520189326e-05, + "sensitivity": 1.701589804272902 + }, + { + "name": "model.layers.23.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.59958197704691e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0106754972366616e-05, + "sensitivity": 0.6283119387103795 + }, + { + "name": "model.layers.23.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.551648064283654e-05, + "sensitivity": 0.9535833665992497 + }, + { + "name": "model.layers.23.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.50962419967982e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006053246324881911, + "sensitivity": 0.5258176047548305 + }, + { + "name": "model.layers.23.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.295957427937537e-05, + "sensitivity": 0.7311575489518543 + }, + { + "name": "model.layers.23.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.713862709759269e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007193150813691318, + "sensitivity": 0.5742119652763369 + }, + { + "name": "model.layers.23.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.042717723175883e-05, + "sensitivity": 0.9414144913039996 + }, + { + "name": "model.layers.23.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.212848001676321e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.012164521962404e-05, + "sensitivity": 0.6178189584342826 + }, + { + "name": "model.layers.23.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0573603503871709e-05, + "sensitivity": 1.4148434419702227 + }, + { + "name": "model.layers.23.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.089459247959894e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006368387257680297, + "sensitivity": 0.5225359640847094 + }, + { + "name": "model.layers.23.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.935625813435763e-05, + "sensitivity": 0.6747077547165619 + }, + { + "name": "model.layers.23.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.542618050138117e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006606288952752948, + "sensitivity": 0.5473435111469347 + }, + { + "name": "model.layers.23.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.404926534742117e-05, + "sensitivity": 0.8899763051698821 + }, + { + "name": "model.layers.23.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.671967179907369e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.300906534306705e-05, + "sensitivity": 0.600380698401833 + }, + { + "name": "model.layers.23.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.015099279466085e-05, + "sensitivity": 0.816960628129437 + }, + { + "name": "model.layers.23.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.472411655522592e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006699608638882637, + "sensitivity": 0.5821121422874357 + }, + { + "name": "model.layers.23.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.389273792388849e-05, + "sensitivity": 0.6313974277669374 + }, + { + "name": "model.layers.23.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.976168040433549e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006152235437184572, + "sensitivity": 0.586383065151956 + }, + { + "name": "model.layers.23.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.399668200174347e-05, + "sensitivity": 0.9940653674707804 + }, + { + "name": "model.layers.23.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.917273023849702e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007643412100151181, + "sensitivity": 0.5771344490527444 + }, + { + "name": "model.layers.23.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0907485375355463e-05, + "sensitivity": 1.4598568322800671 + }, + { + "name": "model.layers.23.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.800564046396175e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5692315072519705e-05, + "sensitivity": 0.7275793084576685 + }, + { + "name": "model.layers.23.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.083292464609258e-05, + "sensitivity": 1.1272612840394125 + }, + { + "name": "model.layers.23.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.126334023472737e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.181707431096584e-05, + "sensitivity": 0.8710483636421799 + }, + { + "name": "model.layers.23.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.230451253941283e-05, + "sensitivity": 0.8364537727195583 + }, + { + "name": "model.layers.23.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.395862778343144e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007110959850251675, + "sensitivity": 0.5194094661328419 + }, + { + "name": "model.layers.23.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1245319001318421e-05, + "sensitivity": 1.3832111206010302 + }, + { + "name": "model.layers.23.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.473218369748793e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006979455938562751, + "sensitivity": 0.5748708793533971 + }, + { + "name": "model.layers.23.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.201693759066984e-05, + "sensitivity": 1.1494530558457474 + }, + { + "name": "model.layers.23.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.804853001085576e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006895688129588962, + "sensitivity": 0.5954026503269555 + }, + { + "name": "model.layers.23.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.206110573548358e-05, + "sensitivity": 1.4599017219590174 + }, + { + "name": "model.layers.23.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.246200781679363e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.551800470333546e-05, + "sensitivity": 0.8261366257562447 + }, + { + "name": "model.layers.23.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0060684871859848e-05, + "sensitivity": 1.9725452279880398 + }, + { + "name": "model.layers.23.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.311898914646008e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.208549555391073e-05, + "sensitivity": 0.6794733054360207 + }, + { + "name": "model.layers.23.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.904023419134319e-05, + "sensitivity": 0.8533573873948748 + }, + { + "name": "model.layers.23.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.429813765862491e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006444841856136918, + "sensitivity": 0.5407334537006119 + }, + { + "name": "model.layers.23.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.47583622392267e-05, + "sensitivity": 1.0912380550073626 + }, + { + "name": "model.layers.23.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.69008784370817e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006082548061385751, + "sensitivity": 0.5270244483420728 + }, + { + "name": "model.layers.23.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.762826185673475e-05, + "sensitivity": 1.1961303692694545 + }, + { + "name": "model.layers.23.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.276253649659338e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006592716090381145, + "sensitivity": 0.5635429416214035 + }, + { + "name": "model.layers.23.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1133539373986423e-05, + "sensitivity": 1.608687981314394 + }, + { + "name": "model.layers.23.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.016695798891305e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.116547592682764e-05, + "sensitivity": 0.6310444527648402 + }, + { + "name": "model.layers.23.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.060164014343172e-05, + "sensitivity": 0.9353490282968993 + }, + { + "name": "model.layers.23.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.526051604145323e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000683646067045629, + "sensitivity": 0.5494155797572733 + }, + { + "name": "model.layers.23.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.790566501673311e-05, + "sensitivity": 0.7976481127560685 + }, + { + "name": "model.layers.23.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.688896974083036e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.765180685557425e-05, + "sensitivity": 0.7379909246330951 + }, + { + "name": "model.layers.23.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.364659591577947e-05, + "sensitivity": 0.8815622405654898 + }, + { + "name": "model.layers.23.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.26893574665155e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.198080907575786e-05, + "sensitivity": 0.9165106798231014 + }, + { + "name": "model.layers.23.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7623656175564975e-05, + "sensitivity": 0.7959622603557931 + }, + { + "name": "model.layers.23.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.85663758051669e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006553898565471172, + "sensitivity": 0.5240360123057535 + }, + { + "name": "model.layers.23.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0623715752444696e-05, + "sensitivity": 1.5529395909487436 + }, + { + "name": "model.layers.23.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.937719033179746e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.827764834975824e-05, + "sensitivity": 0.9891454583356069 + }, + { + "name": "model.layers.23.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.022103480063379e-05, + "sensitivity": 1.1310886239630578 + }, + { + "name": "model.layers.23.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2074810911144596e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.134886643849313e-05, + "sensitivity": 0.9520962296511072 + }, + { + "name": "model.layers.23.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.787921691080555e-05, + "sensitivity": 0.7542097835251735 + }, + { + "name": "model.layers.23.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.574249932280509e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000647238630335778, + "sensitivity": 0.5362168616936781 + }, + { + "name": "model.layers.23.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6341232266277075e-05, + "sensitivity": 0.9510503105197246 + }, + { + "name": "model.layers.23.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.251464921864681e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000620881502982229, + "sensitivity": 0.5878523916127308 + }, + { + "name": "model.layers.23.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.860783130628988e-05, + "sensitivity": 0.8261243888233641 + }, + { + "name": "model.layers.23.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.001381507303449e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006395687814801931, + "sensitivity": 0.5221573542942948 + }, + { + "name": "model.layers.23.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.502608837559819e-05, + "sensitivity": 0.9753307117944833 + }, + { + "name": "model.layers.23.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.92521814724023e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.355502071324736e-05, + "sensitivity": 0.6257292339431655 + }, + { + "name": "model.layers.23.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.149370165076107e-05, + "sensitivity": 0.9846719403853545 + }, + { + "name": "model.layers.23.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.392737870759447e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006734089693054557, + "sensitivity": 0.5861094716957109 + }, + { + "name": "model.layers.23.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8694975450634956e-05, + "sensitivity": 0.6419246145981509 + }, + { + "name": "model.layers.23.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.034480967784475e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00066488201264292, + "sensitivity": 0.5452565258251397 + }, + { + "name": "model.layers.23.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.439764547394589e-05, + "sensitivity": 1.0333184529058272 + }, + { + "name": "model.layers.23.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.722758479962067e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007382944459095597, + "sensitivity": 0.5452297900109437 + }, + { + "name": "model.layers.23.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.637526530539617e-05, + "sensitivity": 1.0154652424565567 + }, + { + "name": "model.layers.23.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.62149170441262e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.713804032187909e-05, + "sensitivity": 0.6738393318943545 + }, + { + "name": "model.layers.23.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.69842777622398e-05, + "sensitivity": 1.1432429899809091 + }, + { + "name": "model.layers.23.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.54938844490971e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006202874938026071, + "sensitivity": 0.5134257167038849 + }, + { + "name": "model.layers.23.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 4.106113010493573e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.584149665897712e-06, + "sensitivity": 1.9805164116591907 + }, + { + "name": "model.layers.23.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.770854265094385e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.23.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 2.115526285706437e-06, + "sensitivity": 2.103942094838983 + }, + { + "name": "model.layers.23.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 6.459436917793937e-06, + "sensitivity": 2.001088489728363 + }, + { + "name": "model.layers.23.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00016866796067915857, + "sensitivity": 0.9043927123252187 + }, + { + "name": "model.layers.23.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.3943327758170199e-05, + "sensitivity": 0.9641423448274783 + }, + { + "name": "model.layers.23.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 4, + "mse": 1.1663777513604145e-05, + "sensitivity": 1.4523839266687488 + }, + { + "name": "model.layers.23.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.000247941876295954, + "sensitivity": 0.7656354394975902 + }, + { + "name": "model.layers.24.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3101101760403253e-06, + "sensitivity": 2.097498756429942 + }, + { + "name": "model.layers.24.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.166096788248979e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006460563745349646, + "sensitivity": 0.5822346385488447 + }, + { + "name": "model.layers.24.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.239144568098709e-05, + "sensitivity": 0.8419268987271631 + }, + { + "name": "model.layers.24.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.13512577021902e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000701237004250288, + "sensitivity": 0.5340104688834474 + }, + { + "name": "model.layers.24.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.567063271882944e-05, + "sensitivity": 1.075776186682438 + }, + { + "name": "model.layers.24.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0221291404377553e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.724414222640917e-05, + "sensitivity": 0.6238970051273653 + }, + { + "name": "model.layers.24.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1388836355763488e-05, + "sensitivity": 1.476937638234124 + }, + { + "name": "model.layers.24.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.754909804840281e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7280045439256355e-05, + "sensitivity": 0.7365326791978575 + }, + { + "name": "model.layers.24.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8917197748087347e-05, + "sensitivity": 0.7919049149805171 + }, + { + "name": "model.layers.24.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.225620268196508e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006562242051586509, + "sensitivity": 0.5502417761636298 + }, + { + "name": "model.layers.24.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.126459629740566e-05, + "sensitivity": 0.9411614469465197 + }, + { + "name": "model.layers.24.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.313999847407104e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006796446396037936, + "sensitivity": 0.5583067123761776 + }, + { + "name": "model.layers.24.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.104196654632688e-05, + "sensitivity": 0.6808956853384065 + }, + { + "name": "model.layers.24.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.528709483674902e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.141296762507409e-05, + "sensitivity": 0.6052810448423196 + }, + { + "name": "model.layers.24.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.881843728478998e-05, + "sensitivity": 1.0969884890372692 + }, + { + "name": "model.layers.24.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.527338988846168e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.026315142866224e-05, + "sensitivity": 0.7505424705024761 + }, + { + "name": "model.layers.24.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.19579732301645e-05, + "sensitivity": 0.7653969001937377 + }, + { + "name": "model.layers.24.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.451030109630665e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.180327909532934e-05, + "sensitivity": 0.62838929593993 + }, + { + "name": "model.layers.24.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.19618222117424e-05, + "sensitivity": 0.9536534773642711 + }, + { + "name": "model.layers.24.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.862980737627367e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000681792851537466, + "sensitivity": 0.5121415048969691 + }, + { + "name": "model.layers.24.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.377277951381984e-06, + "sensitivity": 2.0971398448596315 + }, + { + "name": "model.layers.24.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.087228712203796e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.637483991449699e-05, + "sensitivity": 0.8367330787007305 + }, + { + "name": "model.layers.24.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006845964817330241, + "sensitivity": 0.5788298693710906 + }, + { + "name": "model.layers.24.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.739252285115072e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006864133174531162, + "sensitivity": 0.5247952235783319 + }, + { + "name": "model.layers.24.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.281426612986252e-05, + "sensitivity": 0.9186774728603584 + }, + { + "name": "model.layers.24.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0829402299350477e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.345783185679466e-05, + "sensitivity": 0.6500530527072678 + }, + { + "name": "model.layers.24.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.098053326131776e-05, + "sensitivity": 1.7576605422890417 + }, + { + "name": "model.layers.24.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.737512982610497e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8556739531923085e-05, + "sensitivity": 0.7566216553860602 + }, + { + "name": "model.layers.24.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.182257493492216e-05, + "sensitivity": 1.124029333124639 + }, + { + "name": "model.layers.24.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.221560960919305e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.27022236585617e-05, + "sensitivity": 0.729859516950556 + }, + { + "name": "model.layers.24.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.990046702208929e-05, + "sensitivity": 0.6712516084924582 + }, + { + "name": "model.layers.24.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.412969580400386e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006706073763780296, + "sensitivity": 0.5697078914955702 + }, + { + "name": "model.layers.24.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9829482779605314e-05, + "sensitivity": 0.6399838696236848 + }, + { + "name": "model.layers.24.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.75678017816972e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000674064620397985, + "sensitivity": 0.5503889236785967 + }, + { + "name": "model.layers.24.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.074592728400603e-05, + "sensitivity": 1.210066734533182 + }, + { + "name": "model.layers.24.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.96288122223632e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.016989209456369e-05, + "sensitivity": 0.6042026914884189 + }, + { + "name": "model.layers.24.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.23895030003041e-05, + "sensitivity": 1.1950439471455778 + }, + { + "name": "model.layers.24.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.630090976817883e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000698382849805057, + "sensitivity": 0.541293369645206 + }, + { + "name": "model.layers.24.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.3548818060371559e-05, + "sensitivity": 1.313149006493195 + }, + { + "name": "model.layers.24.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.878849490021821e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.107302371878177e-05, + "sensitivity": 0.8574388053014641 + }, + { + "name": "model.layers.24.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3835850849281996e-05, + "sensitivity": 1.1365424828827473 + }, + { + "name": "model.layers.24.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.402996758770314e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.535260424949229e-05, + "sensitivity": 0.8371759659242822 + }, + { + "name": "model.layers.24.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.898263771086931e-05, + "sensitivity": 0.9113514334100313 + }, + { + "name": "model.layers.24.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2283056776141166e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.922736818320118e-05, + "sensitivity": 0.8874386103524159 + }, + { + "name": "model.layers.24.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0770268090709578e-05, + "sensitivity": 1.4570369457867736 + }, + { + "name": "model.layers.24.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.33263994131994e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006285202107392251, + "sensitivity": 0.5741495354073028 + }, + { + "name": "model.layers.24.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1003145118593238e-05, + "sensitivity": 1.212075173725774 + }, + { + "name": "model.layers.24.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.576364507462131e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000683597638271749, + "sensitivity": 0.5649832509339734 + }, + { + "name": "model.layers.24.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.065877586370334e-05, + "sensitivity": 1.2804553872179476 + }, + { + "name": "model.layers.24.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.69165853348386e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006455188849940896, + "sensitivity": 0.527263069237397 + }, + { + "name": "model.layers.24.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.38758938293904e-05, + "sensitivity": 0.9701758806713681 + }, + { + "name": "model.layers.24.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.689635594942956e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007257977849803865, + "sensitivity": 0.5575498435728026 + }, + { + "name": "model.layers.24.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.379558180924505e-05, + "sensitivity": 0.633479862693713 + }, + { + "name": "model.layers.24.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.006500138435513e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.424727325793356e-05, + "sensitivity": 0.6211253468110328 + }, + { + "name": "model.layers.24.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0721246326284017e-05, + "sensitivity": 1.3518969577954791 + }, + { + "name": "model.layers.24.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.301311827883183e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006434733513742685, + "sensitivity": 0.5483611292361205 + }, + { + "name": "model.layers.24.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7765544624999166e-05, + "sensitivity": 0.9530281586620297 + }, + { + "name": "model.layers.24.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.962465934317152e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000654479255899787, + "sensitivity": 0.558429611734185 + }, + { + "name": "model.layers.24.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.293647311395034e-05, + "sensitivity": 0.6824504092662931 + }, + { + "name": "model.layers.24.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.2765277536746e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.308119191089645e-05, + "sensitivity": 0.6473609417607884 + }, + { + "name": "model.layers.24.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.230151484487578e-05, + "sensitivity": 0.786045035999273 + }, + { + "name": "model.layers.24.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.578475222340785e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.253697210922837e-05, + "sensitivity": 0.634445163643696 + }, + { + "name": "model.layers.24.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6325672630919144e-05, + "sensitivity": 1.1053331657455396 + }, + { + "name": "model.layers.24.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.854134315086412e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006331233307719231, + "sensitivity": 0.5400867067219166 + }, + { + "name": "model.layers.24.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0735990144894458e-05, + "sensitivity": 1.8083117699560873 + }, + { + "name": "model.layers.24.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.506873900325445e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.502840940607712e-05, + "sensitivity": 0.9100078257138581 + }, + { + "name": "model.layers.24.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.868079460924491e-05, + "sensitivity": 1.0494545958969714 + }, + { + "name": "model.layers.24.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.619117579655722e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006558973109349608, + "sensitivity": 0.5810709301784469 + }, + { + "name": "model.layers.24.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0673756150936242e-05, + "sensitivity": 1.2066349701065369 + }, + { + "name": "model.layers.24.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.823955456842668e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006472342065535486, + "sensitivity": 0.5521608515462972 + }, + { + "name": "model.layers.24.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.036263584974222e-05, + "sensitivity": 0.994337588321382 + }, + { + "name": "model.layers.24.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.74975967235514e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.867867366760038e-05, + "sensitivity": 0.753702432917827 + }, + { + "name": "model.layers.24.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0582649894058704e-05, + "sensitivity": 0.9633664550910637 + }, + { + "name": "model.layers.24.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.676191557948187e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000666131149046123, + "sensitivity": 0.5609909368165344 + }, + { + "name": "model.layers.24.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.99828599661123e-05, + "sensitivity": 0.9996903616095623 + }, + { + "name": "model.layers.24.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.510273919957399e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006490254309028387, + "sensitivity": 0.5806831536599573 + }, + { + "name": "model.layers.24.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.116055737948045e-05, + "sensitivity": 1.1638283119288924 + }, + { + "name": "model.layers.24.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.127702812998905e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006891604280099273, + "sensitivity": 0.5283744765108511 + }, + { + "name": "model.layers.24.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0957405720546376e-05, + "sensitivity": 1.2149797354096572 + }, + { + "name": "model.layers.24.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.181051842053421e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006686467677354813, + "sensitivity": 0.5618212514991637 + }, + { + "name": "model.layers.24.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7066205044975504e-05, + "sensitivity": 1.1126727803095082 + }, + { + "name": "model.layers.24.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.40406107979652e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.587047780863941e-05, + "sensitivity": 0.729550181187613 + }, + { + "name": "model.layers.24.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0730101166700479e-05, + "sensitivity": 1.4753435243166644 + }, + { + "name": "model.layers.24.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3472138107317733e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.415573104983196e-05, + "sensitivity": 0.9960226837431138 + }, + { + "name": "model.layers.24.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.990861609461717e-05, + "sensitivity": 1.1485472508698686 + }, + { + "name": "model.layers.24.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.694502528465819e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8173289289698005e-05, + "sensitivity": 0.6306223194539833 + }, + { + "name": "model.layers.24.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0163108527194709e-05, + "sensitivity": 1.599964894251045 + }, + { + "name": "model.layers.24.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.050348702046904e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.4562664445256814e-05, + "sensitivity": 0.6166827874974443 + }, + { + "name": "model.layers.24.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.822442108183168e-05, + "sensitivity": 1.1979137493980454 + }, + { + "name": "model.layers.24.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.319021395029267e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006293452461250126, + "sensitivity": 0.5243806543341578 + }, + { + "name": "model.layers.24.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.056778511265293e-05, + "sensitivity": 0.6298051871574949 + }, + { + "name": "model.layers.24.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.083143600539188e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006835462991148233, + "sensitivity": 0.551135456602543 + }, + { + "name": "model.layers.24.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.124116352002602e-05, + "sensitivity": 1.212751631181938 + }, + { + "name": "model.layers.24.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2752592510878458e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.897781375097111e-05, + "sensitivity": 0.9952740060659527 + }, + { + "name": "model.layers.24.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.248210411285982e-05, + "sensitivity": 0.7748557148522042 + }, + { + "name": "model.layers.24.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.206530542840483e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006776286172680557, + "sensitivity": 0.5538494671792241 + }, + { + "name": "model.layers.24.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0782484423543792e-05, + "sensitivity": 1.4106850234790977 + }, + { + "name": "model.layers.24.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.655869123685989e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006525579374283552, + "sensitivity": 0.5842808944356076 + }, + { + "name": "model.layers.24.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3476841306546703e-06, + "sensitivity": 2.0972166832124017 + }, + { + "name": "model.layers.24.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.907204573915806e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.486647569341585e-05, + "sensitivity": 0.8810614361555321 + }, + { + "name": "model.layers.24.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.780210242141038e-05, + "sensitivity": 1.0335258205273472 + }, + { + "name": "model.layers.24.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.420611490895681e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.889079668326303e-05, + "sensitivity": 0.6305333402819896 + }, + { + "name": "model.layers.24.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.912439519306645e-05, + "sensitivity": 0.9605757333577826 + }, + { + "name": "model.layers.24.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.538449947081972e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006573281134478748, + "sensitivity": 0.5604943414586883 + }, + { + "name": "model.layers.24.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7212859246646985e-05, + "sensitivity": 0.8346824688577925 + }, + { + "name": "model.layers.24.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.99485405877931e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5804059229558334e-05, + "sensitivity": 0.6300873937943311 + }, + { + "name": "model.layers.24.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.263878458412364e-05, + "sensitivity": 0.939136365055999 + }, + { + "name": "model.layers.24.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.99798340772395e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006797324167564511, + "sensitivity": 0.5515761717323965 + }, + { + "name": "model.layers.24.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.742678669979796e-05, + "sensitivity": 0.7200637523853529 + }, + { + "name": "model.layers.24.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.808769962342922e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007576106581836939, + "sensitivity": 0.5590005969124842 + }, + { + "name": "model.layers.24.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0697312063712161e-05, + "sensitivity": 1.3295917516081444 + }, + { + "name": "model.layers.24.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.167903047251457e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000635925680398941, + "sensitivity": 0.5942573439408205 + }, + { + "name": "model.layers.24.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1199506843695417e-05, + "sensitivity": 1.3092014527289029 + }, + { + "name": "model.layers.24.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3899286841478897e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9886235248995945e-05, + "sensitivity": 0.7095641792791587 + }, + { + "name": "model.layers.24.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.664139098371379e-05, + "sensitivity": 0.8571310282777946 + }, + { + "name": "model.layers.24.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.193651410692837e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.529048212338239e-05, + "sensitivity": 0.684190293664042 + }, + { + "name": "model.layers.24.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.004059105180204e-05, + "sensitivity": 0.7645255779930702 + }, + { + "name": "model.layers.24.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.306298582283489e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006880129221826792, + "sensitivity": 0.5387919632290868 + }, + { + "name": "model.layers.24.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.230159488040954e-05, + "sensitivity": 0.9156547575545235 + }, + { + "name": "model.layers.24.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0040537290478824e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.1015598475933075e-05, + "sensitivity": 0.6049721614116705 + }, + { + "name": "model.layers.24.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.245731436938513e-05, + "sensitivity": 1.4419565248472832 + }, + { + "name": "model.layers.24.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.423937967767415e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.96554416208528e-05, + "sensitivity": 0.8734700975680405 + }, + { + "name": "model.layers.24.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.199470954015851e-05, + "sensitivity": 1.0667263595542007 + }, + { + "name": "model.layers.24.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.628411028941628e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006832791259512305, + "sensitivity": 0.5470922012191087 + }, + { + "name": "model.layers.24.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.935063381912187e-05, + "sensitivity": 0.9619607620254229 + }, + { + "name": "model.layers.24.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.941553121781908e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006706849671900272, + "sensitivity": 0.5213310164468583 + }, + { + "name": "model.layers.24.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.600825872737914e-05, + "sensitivity": 1.1744746305933358 + }, + { + "name": "model.layers.24.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.518222784914542e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007472659926861525, + "sensitivity": 0.5589237175330197 + }, + { + "name": "model.layers.24.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 3.871424269163981e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4003320504562e-06, + "sensitivity": 2.101964718526645 + }, + { + "name": "model.layers.24.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.987067990849027e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.24.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 8.952685675467364e-06, + "sensitivity": 1.2515614607251746 + }, + { + "name": "model.layers.24.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 7.875893061282113e-06, + "sensitivity": 2.052384444753904 + }, + { + "name": "model.layers.24.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.0001954666804522276, + "sensitivity": 0.9159879468535314 + }, + { + "name": "model.layers.24.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.7538728570798412e-05, + "sensitivity": 1.1713133590626483 + }, + { + "name": "model.layers.24.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.7663171901367605e-05, + "sensitivity": 0.7101762420091022 + }, + { + "name": "model.layers.24.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003041939053218812, + "sensitivity": 1.126339760991559 + }, + { + "name": "model.layers.25.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.286647112574428e-05, + "sensitivity": 0.8471455667954055 + }, + { + "name": "model.layers.25.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.872229955159128e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0540995036717504e-05, + "sensitivity": 0.6585349612688559 + }, + { + "name": "model.layers.25.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.573334394488484e-05, + "sensitivity": 1.128326478689371 + }, + { + "name": "model.layers.25.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3334578170542954e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007252152427099645, + "sensitivity": 0.5970338713902094 + }, + { + "name": "model.layers.25.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0478672821773216e-05, + "sensitivity": 0.8327409166793602 + }, + { + "name": "model.layers.25.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.957023851507984e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.921353294979781e-05, + "sensitivity": 0.6685693729671394 + }, + { + "name": "model.layers.25.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.455922266468406e-05, + "sensitivity": 1.1424972387905736 + }, + { + "name": "model.layers.25.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.580217354392516e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000713277782779187, + "sensitivity": 0.5342946284060676 + }, + { + "name": "model.layers.25.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.12496369285509e-05, + "sensitivity": 0.8183668681277728 + }, + { + "name": "model.layers.25.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.037155569378228e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006749966996721923, + "sensitivity": 0.5563694217435456 + }, + { + "name": "model.layers.25.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.359109829645604e-05, + "sensitivity": 0.7873669092763788 + }, + { + "name": "model.layers.25.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.262935580205522e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007152028265409172, + "sensitivity": 0.5471079440340603 + }, + { + "name": "model.layers.25.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0791198292281479e-05, + "sensitivity": 1.3551873658872342 + }, + { + "name": "model.layers.25.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.332358791245497e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006213188753463328, + "sensitivity": 0.57077612676805 + }, + { + "name": "model.layers.25.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.622391472570598e-05, + "sensitivity": 1.0631425516212347 + }, + { + "name": "model.layers.25.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.76281308894977e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006373782525770366, + "sensitivity": 0.5644439969292463 + }, + { + "name": "model.layers.25.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.963730265852064e-05, + "sensitivity": 1.011722056180368 + }, + { + "name": "model.layers.25.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.297167823911877e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007766250055283308, + "sensitivity": 0.5763564746278718 + }, + { + "name": "model.layers.25.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2678750863415189e-05, + "sensitivity": 1.5744290919975377 + }, + { + "name": "model.layers.25.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.702806439941924e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007705413154326379, + "sensitivity": 0.5658629794046814 + }, + { + "name": "model.layers.25.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0460577868798282e-05, + "sensitivity": 1.4612759304469225 + }, + { + "name": "model.layers.25.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.496520879612945e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006131215486675501, + "sensitivity": 0.5403102176327339 + }, + { + "name": "model.layers.25.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.222935917321593e-05, + "sensitivity": 0.6817713486929649 + }, + { + "name": "model.layers.25.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.961325880183722e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006979592144489288, + "sensitivity": 0.5427507159965238 + }, + { + "name": "model.layers.25.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.31205621175468e-05, + "sensitivity": 0.9853243058463192 + }, + { + "name": "model.layers.25.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.149782158601738e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.365451554302126e-05, + "sensitivity": 0.6584945790971879 + }, + { + "name": "model.layers.25.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.557085725944489e-05, + "sensitivity": 0.8987599042721266 + }, + { + "name": "model.layers.25.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.744257348145766e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007361824973486364, + "sensitivity": 0.5096820129944093 + }, + { + "name": "model.layers.25.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1074920621467754e-05, + "sensitivity": 1.2169612408709582 + }, + { + "name": "model.layers.25.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.981093403941486e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006461696466431022, + "sensitivity": 0.5621877421279358 + }, + { + "name": "model.layers.25.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.434924580389634e-05, + "sensitivity": 0.6857082110218493 + }, + { + "name": "model.layers.25.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.919032896097633e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007239067927002907, + "sensitivity": 0.5188313159768583 + }, + { + "name": "model.layers.25.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.11235445830971e-05, + "sensitivity": 1.007237311494825 + }, + { + "name": "model.layers.25.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.790399993406027e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006891667726449668, + "sensitivity": 0.554976936153453 + }, + { + "name": "model.layers.25.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.647338159382343e-05, + "sensitivity": 0.9451881267784535 + }, + { + "name": "model.layers.25.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.924977580842096e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007526649860665202, + "sensitivity": 0.5879442045453436 + }, + { + "name": "model.layers.25.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.337511538527906e-05, + "sensitivity": 0.91672442654447 + }, + { + "name": "model.layers.25.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.092075975378975e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.2231320296414196e-05, + "sensitivity": 0.624316215100591 + }, + { + "name": "model.layers.25.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.300158565863967e-05, + "sensitivity": 1.1026023513859604 + }, + { + "name": "model.layers.25.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3727953955822159e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007415349828079343, + "sensitivity": 0.5923834468009153 + }, + { + "name": "model.layers.25.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9549092839006335e-05, + "sensitivity": 0.6840087995677124 + }, + { + "name": "model.layers.25.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.096685633063316e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006694148178212345, + "sensitivity": 0.5341707799588546 + }, + { + "name": "model.layers.25.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006697954377159476, + "sensitivity": 0.5848955975805095 + }, + { + "name": "model.layers.25.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.628990488228737e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006618675542995334, + "sensitivity": 0.5440968932469578 + }, + { + "name": "model.layers.25.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.796727418783121e-05, + "sensitivity": 0.8853917652776598 + }, + { + "name": "model.layers.25.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.437384172386373e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006296419887803495, + "sensitivity": 0.5651341927498922 + }, + { + "name": "model.layers.25.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9863243222935125e-05, + "sensitivity": 0.9294461627357892 + }, + { + "name": "model.layers.25.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.530850669150823e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006784807774238288, + "sensitivity": 0.5029326532326508 + }, + { + "name": "model.layers.25.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.7675014280248433e-06, + "sensitivity": 2.0978637382936043 + }, + { + "name": "model.layers.25.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1973803566434071e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.702878115698695e-05, + "sensitivity": 0.9690958048197583 + }, + { + "name": "model.layers.25.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4322214358107885e-06, + "sensitivity": 2.0974161851797506 + }, + { + "name": "model.layers.25.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.109196644705662e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006256903288885951, + "sensitivity": 0.5683746300321879 + }, + { + "name": "model.layers.25.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.042145469109528e-05, + "sensitivity": 1.1862684309028797 + }, + { + "name": "model.layers.25.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.639827567298198e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006715126219205558, + "sensitivity": 0.5770297128297731 + }, + { + "name": "model.layers.25.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1826191439467948e-05, + "sensitivity": 1.2708028899879098 + }, + { + "name": "model.layers.25.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.918103281350341e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007063332013785839, + "sensitivity": 0.5500600021803825 + }, + { + "name": "model.layers.25.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9420923207653686e-05, + "sensitivity": 1.0949579106828966 + }, + { + "name": "model.layers.25.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.541110562669928e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.889019666938111e-05, + "sensitivity": 0.788751412502666 + }, + { + "name": "model.layers.25.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2414244338287972e-05, + "sensitivity": 1.3477447019808597 + }, + { + "name": "model.layers.25.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0329163160349708e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.794578803237528e-05, + "sensitivity": 0.7557453314070244 + }, + { + "name": "model.layers.25.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7458324590697885e-05, + "sensitivity": 1.0266821943370958 + }, + { + "name": "model.layers.25.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.072519340705185e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006467581260949373, + "sensitivity": 0.5230792312805237 + }, + { + "name": "model.layers.25.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.516865687444806e-05, + "sensitivity": 0.7404344050137536 + }, + { + "name": "model.layers.25.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.505211669922573e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007447988609783351, + "sensitivity": 0.5306202899400626 + }, + { + "name": "model.layers.25.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0121468221768737e-05, + "sensitivity": 1.9109391866083592 + }, + { + "name": "model.layers.25.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.631268891193031e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.468084054882638e-05, + "sensitivity": 0.6531271462115653 + }, + { + "name": "model.layers.25.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8144269132753834e-05, + "sensitivity": 0.8232349463579154 + }, + { + "name": "model.layers.25.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.487388759524038e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006441447767429054, + "sensitivity": 0.5401508475229917 + }, + { + "name": "model.layers.25.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.063318141968921e-05, + "sensitivity": 1.1354171190244817 + }, + { + "name": "model.layers.25.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.367643999918073e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000668938853777945, + "sensitivity": 0.5718355543051027 + }, + { + "name": "model.layers.25.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.258355278987437e-05, + "sensitivity": 0.8093694569195755 + }, + { + "name": "model.layers.25.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.359757094287488e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006977439625188708, + "sensitivity": 0.5252835715037875 + }, + { + "name": "model.layers.25.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.911683547310531e-05, + "sensitivity": 0.7730472237933786 + }, + { + "name": "model.layers.25.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.601362881359819e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000648645160254091, + "sensitivity": 0.526662005956213 + }, + { + "name": "model.layers.25.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.6218308347743e-05, + "sensitivity": 0.9470506699484725 + }, + { + "name": "model.layers.25.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.834588243189501e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.557442247867584e-05, + "sensitivity": 0.7874369602931846 + }, + { + "name": "model.layers.25.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8136363804806024e-05, + "sensitivity": 0.9714307034032273 + }, + { + "name": "model.layers.25.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.781023103030748e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006237979396246374, + "sensitivity": 0.5588348675745913 + }, + { + "name": "model.layers.25.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.400638812920079e-05, + "sensitivity": 0.6705446522226461 + }, + { + "name": "model.layers.25.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.34069260488468e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007089774007909, + "sensitivity": 0.5283967094688902 + }, + { + "name": "model.layers.25.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.907401646254584e-05, + "sensitivity": 0.8378535603218288 + }, + { + "name": "model.layers.25.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.26877260603942e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006374302320182323, + "sensitivity": 0.5227986745868392 + }, + { + "name": "model.layers.25.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1679816452669911e-05, + "sensitivity": 1.6965336981590313 + }, + { + "name": "model.layers.25.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.044552618623129e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.039203071850352e-05, + "sensitivity": 0.663138489943017 + }, + { + "name": "model.layers.25.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.849884473718703e-05, + "sensitivity": 1.0152064993128305 + }, + { + "name": "model.layers.25.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.248533281905111e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006589896511286497, + "sensitivity": 0.5410411702998772 + }, + { + "name": "model.layers.25.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.337130616884679e-05, + "sensitivity": 0.854042851828322 + }, + { + "name": "model.layers.25.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.681322588519834e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000716469599865377, + "sensitivity": 0.5239112077287971 + }, + { + "name": "model.layers.25.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.162043428048491e-05, + "sensitivity": 1.0059627554488983 + }, + { + "name": "model.layers.25.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.618364179506898e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.829898873344064e-05, + "sensitivity": 0.7489536608692579 + }, + { + "name": "model.layers.25.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1912498848687392e-05, + "sensitivity": 1.2104026613334729 + }, + { + "name": "model.layers.25.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0199846656178124e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007224151631817222, + "sensitivity": 0.540130739219115 + }, + { + "name": "model.layers.25.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.623871740885079e-05, + "sensitivity": 1.1235654188204687 + }, + { + "name": "model.layers.25.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.463877409463748e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007401038310490549, + "sensitivity": 0.5518693758939852 + }, + { + "name": "model.layers.25.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0035367267846595e-05, + "sensitivity": 1.354559530513249 + }, + { + "name": "model.layers.25.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.783334356441628e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005940498667769134, + "sensitivity": 0.5393961992856359 + }, + { + "name": "model.layers.25.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.171649147290736e-05, + "sensitivity": 1.1526188464160165 + }, + { + "name": "model.layers.25.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.514349249504448e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9292731748428196e-05, + "sensitivity": 0.6069086859657767 + }, + { + "name": "model.layers.25.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.932112253503874e-05, + "sensitivity": 0.959065415223597 + }, + { + "name": "model.layers.25.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.540376489283517e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006403631996363401, + "sensitivity": 0.5259463446766097 + }, + { + "name": "model.layers.25.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.261478119995445e-05, + "sensitivity": 0.8403145748414178 + }, + { + "name": "model.layers.25.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.913360266480595e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006817596731707454, + "sensitivity": 0.5908329276900521 + }, + { + "name": "model.layers.25.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.676748332916759e-05, + "sensitivity": 0.9488072045020128 + }, + { + "name": "model.layers.25.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.761993063264526e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006417943513952196, + "sensitivity": 0.5200728360029869 + }, + { + "name": "model.layers.25.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0705664509441704e-05, + "sensitivity": 0.6144474133901939 + }, + { + "name": "model.layers.25.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.655217248408007e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006721611134707928, + "sensitivity": 0.5382416665000487 + }, + { + "name": "model.layers.25.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.098694610845996e-05, + "sensitivity": 1.4342837308105125 + }, + { + "name": "model.layers.25.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.928292913878977e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006688893772661686, + "sensitivity": 0.5327018465554424 + }, + { + "name": "model.layers.25.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.179852789500728e-05, + "sensitivity": 1.1160128133976237 + }, + { + "name": "model.layers.25.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.74848649850901e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006896787672303617, + "sensitivity": 0.5516972513901114 + }, + { + "name": "model.layers.25.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.28921092255041e-05, + "sensitivity": 1.8813081953607635 + }, + { + "name": "model.layers.25.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.406561503055855e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.135453051887453e-05, + "sensitivity": 0.9816958375619692 + }, + { + "name": "model.layers.25.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4605019461887423e-06, + "sensitivity": 2.0974626367758162 + }, + { + "name": "model.layers.25.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0514595487620682e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.762394721386954e-05, + "sensitivity": 0.842897219038038 + }, + { + "name": "model.layers.25.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1097482456534635e-05, + "sensitivity": 1.7321853496400759 + }, + { + "name": "model.layers.25.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.638290071554366e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006353583885356784, + "sensitivity": 0.5441144175113565 + }, + { + "name": "model.layers.25.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8275862102163956e-05, + "sensitivity": 0.6985646976494273 + }, + { + "name": "model.layers.25.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.333352189358266e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.801986117148772e-05, + "sensitivity": 0.6767515188787182 + }, + { + "name": "model.layers.25.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.822164530400187e-05, + "sensitivity": 1.0966781033818414 + }, + { + "name": "model.layers.25.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.608567441115156e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006657672929577529, + "sensitivity": 0.511201281172172 + }, + { + "name": "model.layers.25.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.917781891184859e-05, + "sensitivity": 0.8401066248136622 + }, + { + "name": "model.layers.25.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.080526873120107e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8453366364119574e-05, + "sensitivity": 0.7581092417365517 + }, + { + "name": "model.layers.25.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0660903171810787e-05, + "sensitivity": 1.4999863172859003 + }, + { + "name": "model.layers.25.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.54994220592198e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6482396757928655e-05, + "sensitivity": 0.8035750886427779 + }, + { + "name": "model.layers.25.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.283951370278373e-05, + "sensitivity": 1.0384848794160542 + }, + { + "name": "model.layers.25.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.231818699438008e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007021225756034255, + "sensitivity": 0.5951085137538634 + }, + { + "name": "model.layers.25.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.861831207061186e-05, + "sensitivity": 0.8012852605586506 + }, + { + "name": "model.layers.25.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.692386472830549e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007526848348788917, + "sensitivity": 0.5968363994876065 + }, + { + "name": "model.layers.25.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 4.615264060703339e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3618731574970298e-06, + "sensitivity": 2.101032065467826 + }, + { + "name": "model.layers.25.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.75916009338107e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.25.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 8.72218151926063e-06, + "sensitivity": 1.5931799251240129 + }, + { + "name": "model.layers.25.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 3.307317820144817e-05, + "sensitivity": 1.942572236694549 + }, + { + "name": "model.layers.25.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00019686020095832646, + "sensitivity": 0.9417370857786393 + }, + { + "name": "model.layers.25.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.448577950213803e-05, + "sensitivity": 1.4305350851324847 + }, + { + "name": "model.layers.25.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0006520400638692081, + "sensitivity": 0.5561367319595021 + }, + { + "name": "model.layers.25.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003004151221830398, + "sensitivity": 0.7192584828288666 + }, + { + "name": "model.layers.26.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007007308304309845, + "sensitivity": 0.5773103954841726 + }, + { + "name": "model.layers.26.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.922249440322048e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006826593307778239, + "sensitivity": 0.51516205027222 + }, + { + "name": "model.layers.26.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.494693661807105e-05, + "sensitivity": 0.9957751843989924 + }, + { + "name": "model.layers.26.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.049514121921675e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007489453419111669, + "sensitivity": 0.5343168857398419 + }, + { + "name": "model.layers.26.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.997002881485969e-05, + "sensitivity": 1.0888956555863443 + }, + { + "name": "model.layers.26.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.736587122053606e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006723866099491715, + "sensitivity": 0.5520143362242681 + }, + { + "name": "model.layers.26.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0447851309436373e-05, + "sensitivity": 1.8484316306338198 + }, + { + "name": "model.layers.26.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.119775773389847e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.4180236475076526e-05, + "sensitivity": 0.6009714906706488 + }, + { + "name": "model.layers.26.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.743294605053961e-05, + "sensitivity": 0.6661311707551536 + }, + { + "name": "model.layers.26.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.041889489300956e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006308346055448055, + "sensitivity": 0.5415496082601963 + }, + { + "name": "model.layers.26.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.109551759436727e-05, + "sensitivity": 1.0661647975559223 + }, + { + "name": "model.layers.26.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.836232273599308e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006897434359416366, + "sensitivity": 0.5652756159574523 + }, + { + "name": "model.layers.26.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.730098200729117e-05, + "sensitivity": 1.1180043391177226 + }, + { + "name": "model.layers.26.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.490895430033561e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006433876696974039, + "sensitivity": 0.5387871228685892 + }, + { + "name": "model.layers.26.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8324811107013375e-05, + "sensitivity": 1.146074155343634 + }, + { + "name": "model.layers.26.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.613256005039148e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006714092451147735, + "sensitivity": 0.5076094455556991 + }, + { + "name": "model.layers.26.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.840799323981628e-05, + "sensitivity": 0.8394437202469865 + }, + { + "name": "model.layers.26.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.822217753528093e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007896681781858206, + "sensitivity": 0.5925955523212638 + }, + { + "name": "model.layers.26.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.946693636360578e-05, + "sensitivity": 0.7061378660002118 + }, + { + "name": "model.layers.26.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.725131349114235e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006610815762542188, + "sensitivity": 0.5311022320588861 + }, + { + "name": "model.layers.26.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5147247621789575e-05, + "sensitivity": 0.8455867481507442 + }, + { + "name": "model.layers.26.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.446809379667684e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006240512011572719, + "sensitivity": 0.5333685417381823 + }, + { + "name": "model.layers.26.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.122437869431451e-05, + "sensitivity": 0.9504782268020985 + }, + { + "name": "model.layers.26.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.343528073353809e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005791670409962535, + "sensitivity": 0.5396502073222493 + }, + { + "name": "model.layers.26.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1802845619968139e-05, + "sensitivity": 1.6313755662173586 + }, + { + "name": "model.layers.26.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0847852536244318e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006850893842056394, + "sensitivity": 0.5696056730264061 + }, + { + "name": "model.layers.26.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.025598612613976e-05, + "sensitivity": 1.5175121089145367 + }, + { + "name": "model.layers.26.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.183715524661238e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006164765218272805, + "sensitivity": 0.5271726884645341 + }, + { + "name": "model.layers.26.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.927102392888628e-05, + "sensitivity": 0.749770497812392 + }, + { + "name": "model.layers.26.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.381018238243996e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006613103905692697, + "sensitivity": 0.5381260922371971 + }, + { + "name": "model.layers.26.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.374707299983129e-05, + "sensitivity": 0.6203640327993435 + }, + { + "name": "model.layers.26.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.861178007966373e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007295961841009557, + "sensitivity": 0.5474890893073727 + }, + { + "name": "model.layers.26.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.026610243570758e-05, + "sensitivity": 1.2536853950603322 + }, + { + "name": "model.layers.26.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.4169280373535e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6732089433353394e-05, + "sensitivity": 0.6953680475033642 + }, + { + "name": "model.layers.26.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.403741281246766e-05, + "sensitivity": 0.6257804485384524 + }, + { + "name": "model.layers.26.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.017271054290177e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007121781818568707, + "sensitivity": 0.540907720495388 + }, + { + "name": "model.layers.26.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8892845117952675e-05, + "sensitivity": 0.9934968204255141 + }, + { + "name": "model.layers.26.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.719297971358174e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006369092734530568, + "sensitivity": 0.5641537739688777 + }, + { + "name": "model.layers.26.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.821870217914693e-05, + "sensitivity": 0.9481442407714711 + }, + { + "name": "model.layers.26.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.440008857884095e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006593175930902362, + "sensitivity": 0.5189045181066165 + }, + { + "name": "model.layers.26.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4539758669561706e-06, + "sensitivity": 2.097500271719418 + }, + { + "name": "model.layers.26.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3739788755628979e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.4762145737186074e-05, + "sensitivity": 0.8009288227365433 + }, + { + "name": "model.layers.26.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.33706949884072e-05, + "sensitivity": 0.8969954246973174 + }, + { + "name": "model.layers.26.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.610607776266988e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000700620177667588, + "sensitivity": 0.5363925268029777 + }, + { + "name": "model.layers.26.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7146549806930125e-05, + "sensitivity": 0.7615099366982612 + }, + { + "name": "model.layers.26.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.891072530379461e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006356819067150354, + "sensitivity": 0.5403539982920995 + }, + { + "name": "model.layers.26.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.854754610685632e-05, + "sensitivity": 0.7480215177072145 + }, + { + "name": "model.layers.26.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.194596148314304e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007931017316877842, + "sensitivity": 0.5716835376979057 + }, + { + "name": "model.layers.26.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.870885433978401e-05, + "sensitivity": 1.070076537501205 + }, + { + "name": "model.layers.26.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.255351874846383e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006672201561741531, + "sensitivity": 0.5288018868547831 + }, + { + "name": "model.layers.26.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4532437237212434e-06, + "sensitivity": 2.0971968422820995 + }, + { + "name": "model.layers.26.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.514305823657196e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006610476411879063, + "sensitivity": 0.5737053930284097 + }, + { + "name": "model.layers.26.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.852452522958629e-05, + "sensitivity": 0.9742023955881975 + }, + { + "name": "model.layers.26.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.490027087442286e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7144672609865665e-05, + "sensitivity": 0.6384735295058241 + }, + { + "name": "model.layers.26.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.429819040931761e-05, + "sensitivity": 1.123827473644933 + }, + { + "name": "model.layers.26.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.083004215426627e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007192158373072743, + "sensitivity": 0.5917919361627515 + }, + { + "name": "model.layers.26.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0525759181473404e-05, + "sensitivity": 0.8901392433179144 + }, + { + "name": "model.layers.26.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0460003068146762e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006799520342610776, + "sensitivity": 0.5474172387340495 + }, + { + "name": "model.layers.26.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.252655293792486e-05, + "sensitivity": 0.9646515316474938 + }, + { + "name": "model.layers.26.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.459434527845588e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006882669404149055, + "sensitivity": 0.5330408502299124 + }, + { + "name": "model.layers.26.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.410731293726712e-05, + "sensitivity": 0.8818156597715803 + }, + { + "name": "model.layers.26.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.920179309119703e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007077368791215122, + "sensitivity": 0.557013759676577 + }, + { + "name": "model.layers.26.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.293944898061454e-05, + "sensitivity": 0.6160327572461622 + }, + { + "name": "model.layers.26.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.997184863801522e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007040548953227699, + "sensitivity": 0.5274621985797522 + }, + { + "name": "model.layers.26.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1285452274023555e-05, + "sensitivity": 1.636799496861495 + }, + { + "name": "model.layers.26.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.504160859956755e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006848671473562717, + "sensitivity": 0.5137228982716278 + }, + { + "name": "model.layers.26.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.987211625324562e-05, + "sensitivity": 0.7503984092907282 + }, + { + "name": "model.layers.26.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.147266387619311e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006635044701397419, + "sensitivity": 0.5223547291368078 + }, + { + "name": "model.layers.26.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8292811445426196e-05, + "sensitivity": 0.8535857909594626 + }, + { + "name": "model.layers.26.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.172399586532265e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006488862563855946, + "sensitivity": 0.5187574136491341 + }, + { + "name": "model.layers.26.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7008037401828915e-05, + "sensitivity": 0.6607011377730527 + }, + { + "name": "model.layers.26.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.081651804379362e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000639228499494493, + "sensitivity": 0.5281131245318267 + }, + { + "name": "model.layers.26.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1334846021782141e-05, + "sensitivity": 1.3476312737522704 + }, + { + "name": "model.layers.26.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.904280548449606e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006778526003472507, + "sensitivity": 0.5974220955672687 + }, + { + "name": "model.layers.26.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1016533790098038e-05, + "sensitivity": 1.7832982831628232 + }, + { + "name": "model.layers.26.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.431939247406262e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006674609030596912, + "sensitivity": 0.5767625735124704 + }, + { + "name": "model.layers.26.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0342572750232648e-05, + "sensitivity": 1.3413954059640778 + }, + { + "name": "model.layers.26.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.276616997842211e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006198016926646233, + "sensitivity": 0.5464895541119174 + }, + { + "name": "model.layers.26.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1058862583013251e-05, + "sensitivity": 1.5794480077576944 + }, + { + "name": "model.layers.26.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2308348686929094e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.717131352867e-05, + "sensitivity": 0.6055437927672602 + }, + { + "name": "model.layers.26.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.968813249841332e-05, + "sensitivity": 0.7826825503936196 + }, + { + "name": "model.layers.26.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3527358078135876e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000779744703322649, + "sensitivity": 0.5591465040025525 + }, + { + "name": "model.layers.26.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.925360164837912e-05, + "sensitivity": 1.1250238466498101 + }, + { + "name": "model.layers.26.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4186114185577026e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6992063036886975e-05, + "sensitivity": 0.7780466636854336 + }, + { + "name": "model.layers.26.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.502835847437382e-05, + "sensitivity": 0.886137305129233 + }, + { + "name": "model.layers.26.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.888290045026224e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006199441268108785, + "sensitivity": 0.5696660474839033 + }, + { + "name": "model.layers.26.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.983981100143865e-05, + "sensitivity": 1.068725652929743 + }, + { + "name": "model.layers.26.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.31129318864987e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8047597121912986e-05, + "sensitivity": 0.8691835449653275 + }, + { + "name": "model.layers.26.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.04926681262441e-05, + "sensitivity": 0.6656224731767797 + }, + { + "name": "model.layers.26.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.634088206032175e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00066728750243783, + "sensitivity": 0.5164341496143652 + }, + { + "name": "model.layers.26.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.108822708483785e-05, + "sensitivity": 0.8994951328998599 + }, + { + "name": "model.layers.26.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.867962151271058e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.008036871207878e-05, + "sensitivity": 0.6381249711729056 + }, + { + "name": "model.layers.26.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.068296715966426e-05, + "sensitivity": 0.8309177849770765 + }, + { + "name": "model.layers.26.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.9453169493936e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.944628719589673e-05, + "sensitivity": 0.6241201601428317 + }, + { + "name": "model.layers.26.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8695026382338256e-05, + "sensitivity": 0.6162294712324463 + }, + { + "name": "model.layers.26.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.835137007030426e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006616695318371058, + "sensitivity": 0.5354274121599369 + }, + { + "name": "model.layers.26.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.971203790977597e-05, + "sensitivity": 0.739914914323999 + }, + { + "name": "model.layers.26.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.643673486905755e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006641644868068397, + "sensitivity": 0.5275381009133806 + }, + { + "name": "model.layers.26.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.648268036864465e-06, + "sensitivity": 2.0211862783162826 + }, + { + "name": "model.layers.26.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.986463282984914e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.508063233923167e-05, + "sensitivity": 0.6385563386622441 + }, + { + "name": "model.layers.26.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0568035577307455e-05, + "sensitivity": 1.8983488337788532 + }, + { + "name": "model.layers.26.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.68668473433354e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006395919481292367, + "sensitivity": 0.5406928877771322 + }, + { + "name": "model.layers.26.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.876376962987706e-05, + "sensitivity": 0.7891032467426481 + }, + { + "name": "model.layers.26.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.524720674860873e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006512111867778003, + "sensitivity": 0.5243822804852416 + }, + { + "name": "model.layers.26.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.204770033946261e-05, + "sensitivity": 0.8407429944419533 + }, + { + "name": "model.layers.26.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.743633432255592e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006865378236398101, + "sensitivity": 0.5575558262629976 + }, + { + "name": "model.layers.26.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006220788927748799, + "sensitivity": 0.5981480719612228 + }, + { + "name": "model.layers.26.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.280528168645105e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006269393488764763, + "sensitivity": 0.5098885095615602 + }, + { + "name": "model.layers.26.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.139402103144675e-05, + "sensitivity": 0.7215968811919413 + }, + { + "name": "model.layers.26.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.4223197543688e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007016627350822091, + "sensitivity": 0.5309104917845455 + }, + { + "name": "model.layers.26.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0670994015526958e-05, + "sensitivity": 1.2511312019689906 + }, + { + "name": "model.layers.26.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.746031880946248e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006563750794157386, + "sensitivity": 0.5476073091812773 + }, + { + "name": "model.layers.26.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2894523024442606e-05, + "sensitivity": 1.4521395447324248 + }, + { + "name": "model.layers.26.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.734033940527297e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008174054673872888, + "sensitivity": 0.5807115751074979 + }, + { + "name": "model.layers.26.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.901339682168327e-05, + "sensitivity": 0.7594414767316222 + }, + { + "name": "model.layers.26.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.220046427391935e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006497324211522937, + "sensitivity": 0.5170585439744774 + }, + { + "name": "model.layers.26.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.162439240142703e-05, + "sensitivity": 0.8055247983949736 + }, + { + "name": "model.layers.26.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.442383088753559e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.139279139460996e-05, + "sensitivity": 0.7063777500625144 + }, + { + "name": "model.layers.26.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.078993227565661e-05, + "sensitivity": 1.720789838217995 + }, + { + "name": "model.layers.26.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.555510481121019e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006535305874422193, + "sensitivity": 0.524243304308953 + }, + { + "name": "model.layers.26.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.356679659802467e-05, + "sensitivity": 0.907474136830013 + }, + { + "name": "model.layers.26.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.796619231863588e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007264696760103106, + "sensitivity": 0.57222064381686 + }, + { + "name": "model.layers.26.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9224970755167305e-05, + "sensitivity": 0.6919700696071359 + }, + { + "name": "model.layers.26.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.444435823344975e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006548903184011579, + "sensitivity": 0.5442624245362361 + }, + { + "name": "model.layers.26.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.057304563000798e-05, + "sensitivity": 0.9894751062733376 + }, + { + "name": "model.layers.26.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.12793394086475e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006722828256897628, + "sensitivity": 0.5310960260202929 + }, + { + "name": "model.layers.26.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.050320735084824e-05, + "sensitivity": 0.755330495189909 + }, + { + "name": "model.layers.26.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0134120884686126e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006652991287410259, + "sensitivity": 0.5190852017284493 + }, + { + "name": "model.layers.26.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 3.9943415686138906e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.520831458241446e-06, + "sensitivity": 2.101308569190747 + }, + { + "name": "model.layers.26.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.758581770962337e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.26.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 8.589102435507812e-06, + "sensitivity": 1.5537654504761338 + }, + { + "name": "model.layers.26.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 3.87376821890939e-05, + "sensitivity": 1.8683685828649303 + }, + { + "name": "model.layers.26.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00017956329975277185, + "sensitivity": 0.995086997359052 + }, + { + "name": "model.layers.26.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.7036092685884796e-05, + "sensitivity": 0.814660240193715 + }, + { + "name": "model.layers.26.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0006765212747268379, + "sensitivity": 0.5175334307332194 + }, + { + "name": "model.layers.26.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00025791715597733855, + "sensitivity": 0.6915713636909062 + }, + { + "name": "model.layers.27.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.384942389559001e-05, + "sensitivity": 0.6470266695895885 + }, + { + "name": "model.layers.27.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.740476917206252e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007095946930348873, + "sensitivity": 0.555704632122844 + }, + { + "name": "model.layers.27.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.642623727908358e-05, + "sensitivity": 0.6827860188874171 + }, + { + "name": "model.layers.27.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.292598525054927e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006332519114948809, + "sensitivity": 0.5325993427234137 + }, + { + "name": "model.layers.27.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.868554191896692e-05, + "sensitivity": 0.7302426792072144 + }, + { + "name": "model.layers.27.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2064905376973911e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008054152131080627, + "sensitivity": 0.5650284706422344 + }, + { + "name": "model.layers.27.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.476628186646849e-05, + "sensitivity": 0.7947266626709241 + }, + { + "name": "model.layers.27.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.502703738282435e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.343161658151075e-05, + "sensitivity": 0.6212420711593487 + }, + { + "name": "model.layers.27.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6375192798441276e-05, + "sensitivity": 0.7518604015650971 + }, + { + "name": "model.layers.27.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.761165647934831e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006241984665393829, + "sensitivity": 0.5298102759211607 + }, + { + "name": "model.layers.27.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.822989623993635e-05, + "sensitivity": 0.7010153279226249 + }, + { + "name": "model.layers.27.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.667352749900601e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.020569708198309e-05, + "sensitivity": 0.6057938044302839 + }, + { + "name": "model.layers.27.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.363321982556954e-06, + "sensitivity": 2.0970905973744047 + }, + { + "name": "model.layers.27.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.999322863521229e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.79564475629013e-05, + "sensitivity": 0.6959552300138085 + }, + { + "name": "model.layers.27.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.124279752839357e-05, + "sensitivity": 0.6087507597349605 + }, + { + "name": "model.layers.27.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.902975767137832e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00068462616764009, + "sensitivity": 0.5534448675267053 + }, + { + "name": "model.layers.27.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2058184438501485e-05, + "sensitivity": 1.3461696849105407 + }, + { + "name": "model.layers.27.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0831686267920304e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007221346022561193, + "sensitivity": 0.5922445621209058 + }, + { + "name": "model.layers.27.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.360869156196713e-05, + "sensitivity": 0.8446105697236841 + }, + { + "name": "model.layers.27.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.690287364108372e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007095012697391212, + "sensitivity": 0.5314148658292116 + }, + { + "name": "model.layers.27.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.289671728154644e-05, + "sensitivity": 0.8603391390507547 + }, + { + "name": "model.layers.27.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.103948173105891e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007050613639876246, + "sensitivity": 0.5248433410884411 + }, + { + "name": "model.layers.27.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007164645940065384, + "sensitivity": 0.5923436166488477 + }, + { + "name": "model.layers.27.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.874838049952814e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007372416439466178, + "sensitivity": 0.581478708241838 + }, + { + "name": "model.layers.27.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.849138688063249e-05, + "sensitivity": 1.0659964264066075 + }, + { + "name": "model.layers.27.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.753326028454467e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006446281331591308, + "sensitivity": 0.5568772932167468 + }, + { + "name": "model.layers.27.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9006350056733936e-05, + "sensitivity": 0.6435032259897163 + }, + { + "name": "model.layers.27.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.293564294741373e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006757780793122947, + "sensitivity": 0.5139642741819704 + }, + { + "name": "model.layers.27.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9676196542568505e-05, + "sensitivity": 0.6621761778009396 + }, + { + "name": "model.layers.27.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.07595518179005e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006712016183882952, + "sensitivity": 0.5404049112478777 + }, + { + "name": "model.layers.27.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006572530837729573, + "sensitivity": 0.5663303489281847 + }, + { + "name": "model.layers.27.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.00596308686363e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000651884765829891, + "sensitivity": 0.522777622674848 + }, + { + "name": "model.layers.27.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.077232344774529e-05, + "sensitivity": 0.7372235884399145 + }, + { + "name": "model.layers.27.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.66835865356552e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005989265046082437, + "sensitivity": 0.520937873586018 + }, + { + "name": "model.layers.27.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006516270223073661, + "sensitivity": 0.5722470722076106 + }, + { + "name": "model.layers.27.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.78013145463774e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006652704323641956, + "sensitivity": 0.5277171724902437 + }, + { + "name": "model.layers.27.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.292153557296842e-05, + "sensitivity": 0.9125960401817063 + }, + { + "name": "model.layers.27.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.208967645055964e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007129345322027802, + "sensitivity": 0.5119475417974205 + }, + { + "name": "model.layers.27.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.972729923087172e-05, + "sensitivity": 1.048058890054307 + }, + { + "name": "model.layers.27.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.318757747678319e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006691188318654895, + "sensitivity": 0.5943031627275932 + }, + { + "name": "model.layers.27.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.422310252673924e-05, + "sensitivity": 0.6284361869446151 + }, + { + "name": "model.layers.27.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.122141028048645e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007417702581733465, + "sensitivity": 0.5461424543763086 + }, + { + "name": "model.layers.27.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1253799129917752e-05, + "sensitivity": 1.4070632954399063 + }, + { + "name": "model.layers.27.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.031011364233564e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006810346385464072, + "sensitivity": 0.5853975783394711 + }, + { + "name": "model.layers.27.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8795223594643176e-05, + "sensitivity": 0.9736073550263282 + }, + { + "name": "model.layers.27.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.538066372741014e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00066421739757061, + "sensitivity": 0.5420263302412424 + }, + { + "name": "model.layers.27.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.805718683404848e-05, + "sensitivity": 0.7099313250576189 + }, + { + "name": "model.layers.27.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.717152357145096e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006543698254972696, + "sensitivity": 0.5375193295575428 + }, + { + "name": "model.layers.27.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.125729123596102e-05, + "sensitivity": 0.7403609161363012 + }, + { + "name": "model.layers.27.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.595724014208827e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006544270436279476, + "sensitivity": 0.5501699940643386 + }, + { + "name": "model.layers.27.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1006060958607122e-05, + "sensitivity": 1.392130303156212 + }, + { + "name": "model.layers.27.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1664914154607686e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.830282316310331e-05, + "sensitivity": 0.7122747572809305 + }, + { + "name": "model.layers.27.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1211372111574747e-05, + "sensitivity": 1.2197691108910969 + }, + { + "name": "model.layers.27.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.458983191099833e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8286357671022415e-05, + "sensitivity": 0.9451437107221338 + }, + { + "name": "model.layers.27.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.614034646190703e-05, + "sensitivity": 0.8422466985806579 + }, + { + "name": "model.layers.27.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.95206278275873e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007361894240602851, + "sensitivity": 0.5264628707160204 + }, + { + "name": "model.layers.27.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.172547000460327e-05, + "sensitivity": 0.9257807293254767 + }, + { + "name": "model.layers.27.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3320975540409563e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006792682106606662, + "sensitivity": 0.553119752144999 + }, + { + "name": "model.layers.27.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.479403519828338e-06, + "sensitivity": 2.0970519270363943 + }, + { + "name": "model.layers.27.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.064128221325518e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006763099227100611, + "sensitivity": 0.5496228028495056 + }, + { + "name": "model.layers.27.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7816207117866725e-05, + "sensitivity": 0.6337871055569014 + }, + { + "name": "model.layers.27.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.781809472362511e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006503866752609611, + "sensitivity": 0.5549517762863696 + }, + { + "name": "model.layers.27.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.027934068697505e-05, + "sensitivity": 0.6129501885254899 + }, + { + "name": "model.layers.27.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.778946269354492e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006879507564008236, + "sensitivity": 0.5356812815037768 + }, + { + "name": "model.layers.27.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.029051655787043e-05, + "sensitivity": 1.0706407750024676 + }, + { + "name": "model.layers.27.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.065275096669211e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006839300040155649, + "sensitivity": 0.5339190356078701 + }, + { + "name": "model.layers.27.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0295453295111656e-05, + "sensitivity": 0.7335443146568597 + }, + { + "name": "model.layers.27.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.443141723546432e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006816661916673183, + "sensitivity": 0.5460800670814949 + }, + { + "name": "model.layers.27.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.834179319208488e-05, + "sensitivity": 0.7740231505244342 + }, + { + "name": "model.layers.27.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.265693173190812e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006590489065274596, + "sensitivity": 0.5030929982149938 + }, + { + "name": "model.layers.27.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7815268519334495e-05, + "sensitivity": 0.6567396142634357 + }, + { + "name": "model.layers.27.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.534965220656886e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006578967440873384, + "sensitivity": 0.5153308246690461 + }, + { + "name": "model.layers.27.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.564966704696417e-05, + "sensitivity": 0.9931195557988537 + }, + { + "name": "model.layers.27.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.150376066216268e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006399505655281246, + "sensitivity": 0.5517405155931466 + }, + { + "name": "model.layers.27.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.842160317115486e-05, + "sensitivity": 0.9321401237216101 + }, + { + "name": "model.layers.27.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.363786155816342e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006506257341243327, + "sensitivity": 0.5455580876355213 + }, + { + "name": "model.layers.27.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1292246199445799e-05, + "sensitivity": 1.2701585965846582 + }, + { + "name": "model.layers.27.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1427478057157714e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.153671711217612e-05, + "sensitivity": 0.7317459702728198 + }, + { + "name": "model.layers.27.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007406770600937307, + "sensitivity": 0.5747099633201722 + }, + { + "name": "model.layers.27.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.573866464052116e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007522301748394966, + "sensitivity": 0.5810859913742512 + }, + { + "name": "model.layers.27.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.199054066906683e-05, + "sensitivity": 0.741022700835067 + }, + { + "name": "model.layers.27.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.742003850173205e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006125321378931403, + "sensitivity": 0.530466668122792 + }, + { + "name": "model.layers.27.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1502159395604394e-05, + "sensitivity": 1.4735509324971787 + }, + { + "name": "model.layers.27.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.815812861939776e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006827967590652406, + "sensitivity": 0.5333204508135629 + }, + { + "name": "model.layers.27.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.926302037551068e-05, + "sensitivity": 0.8900549183220812 + }, + { + "name": "model.layers.27.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.560261110484134e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.820286605739966e-05, + "sensitivity": 0.6871348149170888 + }, + { + "name": "model.layers.27.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.991708530928008e-05, + "sensitivity": 0.9436072957356295 + }, + { + "name": "model.layers.27.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.703047231188975e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.012379890307784e-05, + "sensitivity": 0.6313819475175239 + }, + { + "name": "model.layers.27.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.1011320212855935e-05, + "sensitivity": 0.7764919973371954 + }, + { + "name": "model.layers.27.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.579635277783382e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0016154748154804e-05, + "sensitivity": 0.6715777666901775 + }, + { + "name": "model.layers.27.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.094970376580022e-05, + "sensitivity": 0.8549986386836548 + }, + { + "name": "model.layers.27.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6447260122731677e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.047650094842538e-05, + "sensitivity": 0.786721266890773 + }, + { + "name": "model.layers.27.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.011294317431748e-05, + "sensitivity": 0.8003000557510581 + }, + { + "name": "model.layers.27.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.069556318128889e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007085083052515984, + "sensitivity": 0.5338846265200456 + }, + { + "name": "model.layers.27.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1410392289690208e-05, + "sensitivity": 1.600367343713598 + }, + { + "name": "model.layers.27.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.051226020848844e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006981290644034743, + "sensitivity": 0.5155833364470346 + }, + { + "name": "model.layers.27.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.951302591711283e-05, + "sensitivity": 0.612576356416924 + }, + { + "name": "model.layers.27.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.908679779371596e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006668507121503353, + "sensitivity": 0.5275179552618658 + }, + { + "name": "model.layers.27.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0211018889094703e-05, + "sensitivity": 1.44018179834609 + }, + { + "name": "model.layers.27.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.249236091411149e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.694985156878829e-05, + "sensitivity": 0.642853422475003 + }, + { + "name": "model.layers.27.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.523270712932572e-05, + "sensitivity": 0.7531900645993648 + }, + { + "name": "model.layers.27.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.607888387108687e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.543614290421829e-05, + "sensitivity": 0.6161770366373405 + }, + { + "name": "model.layers.27.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.482606113422662e-05, + "sensitivity": 1.133363156556828 + }, + { + "name": "model.layers.27.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.308419753826456e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000725594989489764, + "sensitivity": 0.5692650309442827 + }, + { + "name": "model.layers.27.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.150025728857145e-05, + "sensitivity": 0.7206207370411886 + }, + { + "name": "model.layers.27.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.390909099238343e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000687071995344013, + "sensitivity": 0.53869119430384 + }, + { + "name": "model.layers.27.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.989425699226558e-05, + "sensitivity": 0.828870731865391 + }, + { + "name": "model.layers.27.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.405242510889366e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006657940102741122, + "sensitivity": 0.5425151787579583 + }, + { + "name": "model.layers.27.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3830532427382423e-06, + "sensitivity": 2.0972365605468912 + }, + { + "name": "model.layers.27.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.025142296384729e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.816239718114957e-05, + "sensitivity": 0.6091171092510885 + }, + { + "name": "model.layers.27.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3869087423663586e-05, + "sensitivity": 0.9522800234540035 + }, + { + "name": "model.layers.27.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.263416819114354e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006393005605787039, + "sensitivity": 0.5610410816766879 + }, + { + "name": "model.layers.27.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1341496247041505e-05, + "sensitivity": 1.2471781758916425 + }, + { + "name": "model.layers.27.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.2218118652454e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007247984176501632, + "sensitivity": 0.5739509925005964 + }, + { + "name": "model.layers.27.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.158048538258299e-05, + "sensitivity": 0.8144017278924174 + }, + { + "name": "model.layers.27.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0386789881522418e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.363596523646265e-05, + "sensitivity": 0.7057946130204937 + }, + { + "name": "model.layers.27.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.73617614666e-05, + "sensitivity": 1.0613630927748505 + }, + { + "name": "model.layers.27.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.298902685055509e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.564041541423649e-05, + "sensitivity": 0.8029282396972294 + }, + { + "name": "model.layers.27.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8756821090355515e-05, + "sensitivity": 1.1139750563150939 + }, + { + "name": "model.layers.27.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.802135198493488e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006499493028968573, + "sensitivity": 0.5418985066462261 + }, + { + "name": "model.layers.27.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.183009827509522e-05, + "sensitivity": 0.9981074927665802 + }, + { + "name": "model.layers.27.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.087689250009134e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006809207843616605, + "sensitivity": 0.5443896307182087 + }, + { + "name": "model.layers.27.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.755706661147997e-05, + "sensitivity": 0.8474863751121067 + }, + { + "name": "model.layers.27.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.378040436378797e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006510355742648244, + "sensitivity": 0.5611174568528803 + }, + { + "name": "model.layers.27.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.914029316045344e-05, + "sensitivity": 1.087191160402956 + }, + { + "name": "model.layers.27.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.884197543717164e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006543115014210343, + "sensitivity": 0.585416721839086 + }, + { + "name": "model.layers.27.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006081392057240009, + "sensitivity": 0.5850200563401838 + }, + { + "name": "model.layers.27.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.162151748867473e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006300742388702929, + "sensitivity": 0.5357786867747565 + }, + { + "name": "model.layers.27.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 4.374996024125721e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3550717287434964e-06, + "sensitivity": 2.1006861060842814 + }, + { + "name": "model.layers.27.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.937963684729766e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.27.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.9620028979261406e-06, + "sensitivity": 2.1039647012340463 + }, + { + "name": "model.layers.27.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 3.422369991312735e-05, + "sensitivity": 1.9512029449160893 + }, + { + "name": "model.layers.27.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.0001760940212989226, + "sensitivity": 0.8561525697563467 + }, + { + "name": "model.layers.27.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.4316299711936153e-05, + "sensitivity": 1.2497829376172984 + }, + { + "name": "model.layers.27.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 4, + "mse": 1.2362863344606012e-05, + "sensitivity": 1.7385024860529614 + }, + { + "name": "model.layers.27.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00024785325513221323, + "sensitivity": 0.7570314386150334 + }, + { + "name": "model.layers.28.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1517098755575716e-05, + "sensitivity": 1.3845221120481037 + }, + { + "name": "model.layers.28.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.235366426044493e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.300222594290972e-05, + "sensitivity": 0.6171037872326194 + }, + { + "name": "model.layers.28.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.915984365856275e-05, + "sensitivity": 0.8207255057656406 + }, + { + "name": "model.layers.28.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.474081146734534e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006657486082985997, + "sensitivity": 0.5373346265949668 + }, + { + "name": "model.layers.28.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9264675655867904e-05, + "sensitivity": 0.7928243784429634 + }, + { + "name": "model.layers.28.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.283659897439065e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006783275748603046, + "sensitivity": 0.5343504565474738 + }, + { + "name": "model.layers.28.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.089310045354068e-05, + "sensitivity": 1.0112043354082088 + }, + { + "name": "model.layers.28.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.95663857186446e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006749384920112789, + "sensitivity": 0.5272141302122307 + }, + { + "name": "model.layers.28.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8853504015132785e-05, + "sensitivity": 0.767797311580168 + }, + { + "name": "model.layers.28.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.745196626274264e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006428570486605167, + "sensitivity": 0.5538698233223288 + }, + { + "name": "model.layers.28.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.175230762688443e-05, + "sensitivity": 0.6386149898445586 + }, + { + "name": "model.layers.28.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.729024223910528e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006064579356461763, + "sensitivity": 0.5448054630031786 + }, + { + "name": "model.layers.28.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1074560461565852e-05, + "sensitivity": 1.300341113594244 + }, + { + "name": "model.layers.28.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2048066082570585e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006850849604234099, + "sensitivity": 0.5792856311135804 + }, + { + "name": "model.layers.28.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8372268540551886e-05, + "sensitivity": 0.7087038090522175 + }, + { + "name": "model.layers.28.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0485204029464512e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.873500049347058e-05, + "sensitivity": 0.6929383021879858 + }, + { + "name": "model.layers.28.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.217576446942985e-05, + "sensitivity": 1.1498924725897361 + }, + { + "name": "model.layers.28.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.902825356926769e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000722693745046854, + "sensitivity": 0.5462541055587917 + }, + { + "name": "model.layers.28.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.574763392563909e-05, + "sensitivity": 0.8975571626114702 + }, + { + "name": "model.layers.28.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0201738405157812e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.632195436395705e-05, + "sensitivity": 0.6589211946951546 + }, + { + "name": "model.layers.28.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.866717401659116e-05, + "sensitivity": 0.6960977528777147 + }, + { + "name": "model.layers.28.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.636686293859384e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006761203403584659, + "sensitivity": 0.5262781665243321 + }, + { + "name": "model.layers.28.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.750277705374174e-05, + "sensitivity": 0.640724123122386 + }, + { + "name": "model.layers.28.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.402969686154393e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006664732354693115, + "sensitivity": 0.5329493765184738 + }, + { + "name": "model.layers.28.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.147289968794212e-05, + "sensitivity": 1.006274836211792 + }, + { + "name": "model.layers.28.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.556869038831792e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.136907904874533e-05, + "sensitivity": 0.6648555988683933 + }, + { + "name": "model.layers.28.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.604357284028083e-05, + "sensitivity": 1.0267485738301338 + }, + { + "name": "model.layers.28.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.137729767237033e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006815920351073146, + "sensitivity": 0.5179328404312741 + }, + { + "name": "model.layers.28.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.983300434309058e-05, + "sensitivity": 0.8836541281219474 + }, + { + "name": "model.layers.28.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.475907063460909e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006570428377017379, + "sensitivity": 0.5363534402834835 + }, + { + "name": "model.layers.28.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.829826113767922e-05, + "sensitivity": 0.8573711019697038 + }, + { + "name": "model.layers.28.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.273864983086241e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006609940901398659, + "sensitivity": 0.5274231008003196 + }, + { + "name": "model.layers.28.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1422262105043046e-05, + "sensitivity": 1.4560266423040886 + }, + { + "name": "model.layers.28.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.436868708689872e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.065690831746906e-05, + "sensitivity": 0.8180627705612841 + }, + { + "name": "model.layers.28.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.061400563339703e-05, + "sensitivity": 0.6932434192924551 + }, + { + "name": "model.layers.28.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.611855264462065e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006937377038411796, + "sensitivity": 0.5549329403697381 + }, + { + "name": "model.layers.28.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.449253851315007e-05, + "sensitivity": 0.7200468426547384 + }, + { + "name": "model.layers.28.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.806049436316243e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007630165200680494, + "sensitivity": 0.559927693429743 + }, + { + "name": "model.layers.28.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1119393093395047e-05, + "sensitivity": 1.4443114089478908 + }, + { + "name": "model.layers.28.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.294317694890196e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006443373276852071, + "sensitivity": 0.5614863768960535 + }, + { + "name": "model.layers.28.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.802817759104073e-05, + "sensitivity": 1.077268042673643 + }, + { + "name": "model.layers.28.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.002990870802023e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00064762745751068, + "sensitivity": 0.5281678749478926 + }, + { + "name": "model.layers.28.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.890499960514717e-05, + "sensitivity": 0.6339506119617764 + }, + { + "name": "model.layers.28.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.085098670562729e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000675192684866488, + "sensitivity": 0.5638026440283206 + }, + { + "name": "model.layers.28.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8286794228479266e-05, + "sensitivity": 0.6553369552194496 + }, + { + "name": "model.layers.28.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0889137911362923e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006539142923429608, + "sensitivity": 0.5440131242679858 + }, + { + "name": "model.layers.28.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.973782390356064e-05, + "sensitivity": 0.626382735990033 + }, + { + "name": "model.layers.28.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.798655244390829e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.013415986672044e-05, + "sensitivity": 0.6070579257144499 + }, + { + "name": "model.layers.28.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0933740668406244e-05, + "sensitivity": 1.3959551445713654 + }, + { + "name": "model.layers.28.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.214106077895849e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8029108913615346e-05, + "sensitivity": 0.7369832413226546 + }, + { + "name": "model.layers.28.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006781236152164638, + "sensitivity": 0.5291499154152135 + }, + { + "name": "model.layers.28.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.736474347235344e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006878258427605033, + "sensitivity": 0.5455611382991278 + }, + { + "name": "model.layers.28.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.85953748668544e-05, + "sensitivity": 0.6604650025029976 + }, + { + "name": "model.layers.28.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.37330231256783e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006867152405902743, + "sensitivity": 0.5353496565318944 + }, + { + "name": "model.layers.28.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.808087735204026e-05, + "sensitivity": 0.6195786288448822 + }, + { + "name": "model.layers.28.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.910101658126223e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006605664966627955, + "sensitivity": 0.5175739659711703 + }, + { + "name": "model.layers.28.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.425141327781603e-05, + "sensitivity": 0.8945409969839327 + }, + { + "name": "model.layers.28.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.639427389629418e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000746148347388953, + "sensitivity": 0.5394101651641264 + }, + { + "name": "model.layers.28.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.623642573482357e-05, + "sensitivity": 0.6981493970988233 + }, + { + "name": "model.layers.28.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.729707587917801e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006425504107028246, + "sensitivity": 0.5446858908352791 + }, + { + "name": "model.layers.28.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.771667929366231e-05, + "sensitivity": 1.043072170092894 + }, + { + "name": "model.layers.28.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6778694771346636e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8086414355784655e-05, + "sensitivity": 0.6336775457268262 + }, + { + "name": "model.layers.28.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0286295946571045e-05, + "sensitivity": 1.2720708364551605 + }, + { + "name": "model.layers.28.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.124210128495179e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006483166362158954, + "sensitivity": 0.5292551574166814 + }, + { + "name": "model.layers.28.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.03829394094646e-05, + "sensitivity": 0.6838314290241412 + }, + { + "name": "model.layers.28.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.626148092436779e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006796428933739662, + "sensitivity": 0.5377114467459789 + }, + { + "name": "model.layers.28.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.983950803871267e-06, + "sensitivity": 1.4171620371018916 + }, + { + "name": "model.layers.28.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.082386789785232e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005957980174571276, + "sensitivity": 0.5867069338461128 + }, + { + "name": "model.layers.28.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007051430875435472, + "sensitivity": 0.589400012276723 + }, + { + "name": "model.layers.28.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.397487706839456e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.322187255136669e-05, + "sensitivity": 0.6702334418199658 + }, + { + "name": "model.layers.28.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.233820749912411e-05, + "sensitivity": 0.6778683869009887 + }, + { + "name": "model.layers.28.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.739389502603444e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007077637128531933, + "sensitivity": 0.5376812765830634 + }, + { + "name": "model.layers.28.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.845688039902598e-05, + "sensitivity": 1.0396736290897197 + }, + { + "name": "model.layers.28.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.030115961650154e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.143474067561328e-05, + "sensitivity": 0.6248264622916615 + }, + { + "name": "model.layers.28.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.2241477533243597e-05, + "sensitivity": 0.9017219887392713 + }, + { + "name": "model.layers.28.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.143466973502655e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006028743810020387, + "sensitivity": 0.5151649229634709 + }, + { + "name": "model.layers.28.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.246287375688553e-05, + "sensitivity": 1.0064727279720493 + }, + { + "name": "model.layers.28.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.758940571671701e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007206174777820706, + "sensitivity": 0.5163782116134934 + }, + { + "name": "model.layers.28.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.854380287928507e-05, + "sensitivity": 0.9828884803775354 + }, + { + "name": "model.layers.28.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0652006494638044e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006579567561857402, + "sensitivity": 0.5639534274185943 + }, + { + "name": "model.layers.28.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9275596868246794e-05, + "sensitivity": 0.9987528851731046 + }, + { + "name": "model.layers.28.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.778033707632858e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006891472148708999, + "sensitivity": 0.5912340531527924 + }, + { + "name": "model.layers.28.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8089877711609006e-05, + "sensitivity": 1.0893866229993694 + }, + { + "name": "model.layers.28.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.290603096203995e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.933266947977245e-05, + "sensitivity": 0.6131824993769073 + }, + { + "name": "model.layers.28.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.7811854579340434e-06, + "sensitivity": 2.0978541064883722 + }, + { + "name": "model.layers.28.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6521771613042802e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.854350067442283e-05, + "sensitivity": 0.7121417744227643 + }, + { + "name": "model.layers.28.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0931343240372371e-05, + "sensitivity": 1.458821667791365 + }, + { + "name": "model.layers.28.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.31569082038186e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006785143632441759, + "sensitivity": 0.5437391006811213 + }, + { + "name": "model.layers.28.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.470739026553929e-05, + "sensitivity": 0.9324797120502207 + }, + { + "name": "model.layers.28.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1568572517717257e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007516397163271904, + "sensitivity": 0.5587344518079542 + }, + { + "name": "model.layers.28.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.044458132237196e-05, + "sensitivity": 1.065522808238687 + }, + { + "name": "model.layers.28.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.495884233321704e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.964516822132282e-05, + "sensitivity": 0.6450792591913838 + }, + { + "name": "model.layers.28.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.279005174292251e-05, + "sensitivity": 0.6404639296635584 + }, + { + "name": "model.layers.28.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.020678023967776e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007180289831012487, + "sensitivity": 0.5240334219414674 + }, + { + "name": "model.layers.28.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.884558049729094e-05, + "sensitivity": 0.9194892912211226 + }, + { + "name": "model.layers.28.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3318931451067328e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.72594981349539e-05, + "sensitivity": 0.6520209732223019 + }, + { + "name": "model.layers.28.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007133157923817635, + "sensitivity": 0.5652289004274336 + }, + { + "name": "model.layers.28.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.978086955517938e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007206270820461214, + "sensitivity": 0.5349936654473556 + }, + { + "name": "model.layers.28.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.289721204666421e-05, + "sensitivity": 1.0604471067032206 + }, + { + "name": "model.layers.28.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2000239166809479e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.19155471213162e-05, + "sensitivity": 0.7886211558309308 + }, + { + "name": "model.layers.28.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006505344063043594, + "sensitivity": 0.5559563699226795 + }, + { + "name": "model.layers.28.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.961429335206049e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006614547455683351, + "sensitivity": 0.5372441272969999 + }, + { + "name": "model.layers.28.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4428994189947844e-05, + "sensitivity": 0.9322809397296452 + }, + { + "name": "model.layers.28.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.276102340052603e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.715392035199329e-05, + "sensitivity": 0.6370349331749222 + }, + { + "name": "model.layers.28.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.571246922248974e-05, + "sensitivity": 0.7936023131855989 + }, + { + "name": "model.layers.28.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.35572258841421e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007760361768305302, + "sensitivity": 0.5994543032267188 + }, + { + "name": "model.layers.28.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.421526657301001e-05, + "sensitivity": 0.6068380256072244 + }, + { + "name": "model.layers.28.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.027148629073054e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006373185315169394, + "sensitivity": 0.5458608971655083 + }, + { + "name": "model.layers.28.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.127447704784572e-05, + "sensitivity": 0.888038785071647 + }, + { + "name": "model.layers.28.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.456365776510211e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000687946449033916, + "sensitivity": 0.5528346957227531 + }, + { + "name": "model.layers.28.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.663709816872142e-05, + "sensitivity": 0.659516305615286 + }, + { + "name": "model.layers.28.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.517793735838495e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006496310234069824, + "sensitivity": 0.5702099881270537 + }, + { + "name": "model.layers.28.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.308791489573196e-05, + "sensitivity": 0.7912834917742791 + }, + { + "name": "model.layers.28.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0568131756372168e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007095853798091412, + "sensitivity": 0.5506845417297036 + }, + { + "name": "model.layers.28.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.178260082378983e-05, + "sensitivity": 0.7220366704862622 + }, + { + "name": "model.layers.28.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.263172048827983e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007009397959336638, + "sensitivity": 0.5180845050300533 + }, + { + "name": "model.layers.28.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.927733946009539e-05, + "sensitivity": 0.6857538373807325 + }, + { + "name": "model.layers.28.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0973456028295914e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006766663282178342, + "sensitivity": 0.5318873486268223 + }, + { + "name": "model.layers.28.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.526322977151722e-05, + "sensitivity": 0.9809919719862861 + }, + { + "name": "model.layers.28.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.632684966869419e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.56214397167787e-05, + "sensitivity": 0.693782698302144 + }, + { + "name": "model.layers.28.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.157565076136962e-05, + "sensitivity": 0.6108976481196985 + }, + { + "name": "model.layers.28.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.39800009089231e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006914960104040802, + "sensitivity": 0.5410978766304497 + }, + { + "name": "model.layers.28.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3124076657695696e-05, + "sensitivity": 0.7632922041735228 + }, + { + "name": "model.layers.28.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.212451353349024e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006113330600783229, + "sensitivity": 0.5443667527144924 + }, + { + "name": "model.layers.28.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.783961387351155e-05, + "sensitivity": 0.9927341750697767 + }, + { + "name": "model.layers.28.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.475303729937878e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006453141686506569, + "sensitivity": 0.5253810678740389 + }, + { + "name": "model.layers.28.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.567068339791149e-05, + "sensitivity": 0.8070947229489885 + }, + { + "name": "model.layers.28.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.325666271957743e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007650158368051052, + "sensitivity": 0.548946497516127 + }, + { + "name": "model.layers.28.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 4.076369350514142e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3591956050950103e-06, + "sensitivity": 2.1013863793855396 + }, + { + "name": "model.layers.28.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.214302968350239e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.28.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.926277491293149e-06, + "sensitivity": 2.105096517925529 + }, + { + "name": "model.layers.28.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 9.340635187982116e-06, + "sensitivity": 2.214850930883572 + }, + { + "name": "model.layers.28.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.0002082700520986691, + "sensitivity": 0.8735159737834655 + }, + { + "name": "model.layers.28.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.5722242096671835e-05, + "sensitivity": 1.2867135701127401 + }, + { + "name": "model.layers.28.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0006687938002869487, + "sensitivity": 0.5640842856143823 + }, + { + "name": "model.layers.28.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003138853353448212, + "sensitivity": 1.1068699345194186 + }, + { + "name": "model.layers.29.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2202923244331032e-05, + "sensitivity": 1.2428196903957014 + }, + { + "name": "model.layers.29.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.793938622540736e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.709701847285032e-05, + "sensitivity": 0.7661643064086392 + }, + { + "name": "model.layers.29.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8579746109899133e-05, + "sensitivity": 0.8625076854763248 + }, + { + "name": "model.layers.29.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.088291908985411e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006722623365931213, + "sensitivity": 0.5861116375587321 + }, + { + "name": "model.layers.29.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6195727665908635e-05, + "sensitivity": 0.7857206036264581 + }, + { + "name": "model.layers.29.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.056473805278074e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006662987871095538, + "sensitivity": 0.5242402240112217 + }, + { + "name": "model.layers.29.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.298573134699836e-05, + "sensitivity": 0.7941621586085202 + }, + { + "name": "model.layers.29.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.027045848597481e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000718500348739326, + "sensitivity": 0.5398256409695666 + }, + { + "name": "model.layers.29.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.997763219056651e-05, + "sensitivity": 0.9422023574309845 + }, + { + "name": "model.layers.29.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.827529202586447e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006820994894951582, + "sensitivity": 0.5156950746868437 + }, + { + "name": "model.layers.29.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7777429901761934e-05, + "sensitivity": 0.8031297770775302 + }, + { + "name": "model.layers.29.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.349869974859757e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006921006715856493, + "sensitivity": 0.5894159202616576 + }, + { + "name": "model.layers.29.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006293547339737415, + "sensitivity": 0.5767885804903992 + }, + { + "name": "model.layers.29.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.029985908957315e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006501083262264729, + "sensitivity": 0.5222201841215119 + }, + { + "name": "model.layers.29.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0422586456115823e-05, + "sensitivity": 1.8262739473891656 + }, + { + "name": "model.layers.29.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.732021802235977e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.092646799515933e-05, + "sensitivity": 0.6801860364973717 + }, + { + "name": "model.layers.29.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.57519742869772e-05, + "sensitivity": 0.9318497535566537 + }, + { + "name": "model.layers.29.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.853702186366718e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006657260237261653, + "sensitivity": 0.5008463755297006 + }, + { + "name": "model.layers.29.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0431641385366675e-05, + "sensitivity": 1.2564126978783483 + }, + { + "name": "model.layers.29.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.282388535008067e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006376872770488262, + "sensitivity": 0.5781821326730185 + }, + { + "name": "model.layers.29.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.232323847943917e-05, + "sensitivity": 1.23222239596985 + }, + { + "name": "model.layers.29.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0076587386720348e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007745804032310843, + "sensitivity": 0.5231661935098895 + }, + { + "name": "model.layers.29.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1087429811595939e-05, + "sensitivity": 1.3052851872857085 + }, + { + "name": "model.layers.29.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.89092950981285e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006961814360693097, + "sensitivity": 0.568521998607951 + }, + { + "name": "model.layers.29.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.789749411633238e-05, + "sensitivity": 1.1862038067853358 + }, + { + "name": "model.layers.29.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0700545090003288e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006612049182876945, + "sensitivity": 0.5740127970590566 + }, + { + "name": "model.layers.29.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1066964361816645e-05, + "sensitivity": 1.8996516360439744 + }, + { + "name": "model.layers.29.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.110686854299274e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006680000806227326, + "sensitivity": 0.5398895505502513 + }, + { + "name": "model.layers.29.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.989139754092321e-05, + "sensitivity": 1.153840678749005 + }, + { + "name": "model.layers.29.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.973207516442926e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006780295516364276, + "sensitivity": 0.5714887544583714 + }, + { + "name": "model.layers.29.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006712726317346096, + "sensitivity": 0.5677780107920719 + }, + { + "name": "model.layers.29.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.489924200854148e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006913216784596443, + "sensitivity": 0.5340704240354985 + }, + { + "name": "model.layers.29.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9222507843514904e-05, + "sensitivity": 0.649827532947755 + }, + { + "name": "model.layers.29.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.931711252240348e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000686544575728476, + "sensitivity": 0.588246013381343 + }, + { + "name": "model.layers.29.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007178501691669226, + "sensitivity": 0.5877178282840966 + }, + { + "name": "model.layers.29.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.079519832586811e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007223798893392086, + "sensitivity": 0.5625320938861073 + }, + { + "name": "model.layers.29.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1012469258275814e-05, + "sensitivity": 1.4571201852828575 + }, + { + "name": "model.layers.29.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.967941317270743e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.108960951678455e-05, + "sensitivity": 0.6055201292619797 + }, + { + "name": "model.layers.29.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.926140147494152e-05, + "sensitivity": 1.0577604404584524 + }, + { + "name": "model.layers.29.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.906323844508734e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006800724077038467, + "sensitivity": 0.525615337943894 + }, + { + "name": "model.layers.29.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.233587919268757e-05, + "sensitivity": 0.9036201411088436 + }, + { + "name": "model.layers.29.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.834031177684665e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006956764264032245, + "sensitivity": 0.5367365210087323 + }, + { + "name": "model.layers.29.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.133883289294317e-05, + "sensitivity": 1.1063866674393905 + }, + { + "name": "model.layers.29.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.647083061281592e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.078482692828402e-05, + "sensitivity": 0.7385075662368118 + }, + { + "name": "model.layers.29.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.430511712096632e-05, + "sensitivity": 1.1155245392844504 + }, + { + "name": "model.layers.29.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.49173239000811e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007354483823291957, + "sensitivity": 0.5371326534003364 + }, + { + "name": "model.layers.29.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7947789173340425e-05, + "sensitivity": 0.6919189512275715 + }, + { + "name": "model.layers.29.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.879747616039822e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000661009456962347, + "sensitivity": 0.5075702350296191 + }, + { + "name": "model.layers.29.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006237146444618702, + "sensitivity": 0.5660342879166813 + }, + { + "name": "model.layers.29.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.175422413434717e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006687139975838363, + "sensitivity": 0.5737755669729333 + }, + { + "name": "model.layers.29.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.566625961568207e-05, + "sensitivity": 0.796951613502413 + }, + { + "name": "model.layers.29.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0353799098083982e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007504690438508987, + "sensitivity": 0.5375219017448513 + }, + { + "name": "model.layers.29.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9802037867484614e-05, + "sensitivity": 0.6798338137765498 + }, + { + "name": "model.layers.29.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.311515790002886e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006779401446692646, + "sensitivity": 0.5254973802199494 + }, + { + "name": "model.layers.29.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.283110997173935e-05, + "sensitivity": 0.795784823259125 + }, + { + "name": "model.layers.29.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4023775065652444e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007018701871857047, + "sensitivity": 0.5457532178411342 + }, + { + "name": "model.layers.29.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6196404329966754e-05, + "sensitivity": 1.077523618590845 + }, + { + "name": "model.layers.29.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.569138122358709e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006603479268960655, + "sensitivity": 0.5695466827858201 + }, + { + "name": "model.layers.29.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0752041816886049e-05, + "sensitivity": 1.438171971506604 + }, + { + "name": "model.layers.29.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.768734798853984e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7757853937800974e-05, + "sensitivity": 0.6028970442222918 + }, + { + "name": "model.layers.29.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.138226308394223e-05, + "sensitivity": 0.8964289761600084 + }, + { + "name": "model.layers.29.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.901593784888973e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000711970729753375, + "sensitivity": 0.5863898417525213 + }, + { + "name": "model.layers.29.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0421465958643239e-05, + "sensitivity": 1.3297568669006965 + }, + { + "name": "model.layers.29.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.504629249728168e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006424713646993041, + "sensitivity": 0.5797313588826508 + }, + { + "name": "model.layers.29.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.034183024894446e-05, + "sensitivity": 0.7551102994747794 + }, + { + "name": "model.layers.29.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.961083383634104e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006856407853774726, + "sensitivity": 0.5857623295934988 + }, + { + "name": "model.layers.29.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.09804701525718e-05, + "sensitivity": 0.9258250507563723 + }, + { + "name": "model.layers.29.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.989495773268573e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000705176149494946, + "sensitivity": 0.5613614368827883 + }, + { + "name": "model.layers.29.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.198450864758343e-05, + "sensitivity": 0.6375846212817792 + }, + { + "name": "model.layers.29.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.739246825622104e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007079929928295314, + "sensitivity": 0.5326762379515698 + }, + { + "name": "model.layers.29.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.163555498351343e-05, + "sensitivity": 1.230595093148923 + }, + { + "name": "model.layers.29.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.94154333966435e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.411809590645134e-05, + "sensitivity": 0.805587051807257 + }, + { + "name": "model.layers.29.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1243765584367793e-05, + "sensitivity": 1.241634105147677 + }, + { + "name": "model.layers.29.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.475347842955671e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006898852298036218, + "sensitivity": 0.5839526989530381 + }, + { + "name": "model.layers.29.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1175480722158682e-05, + "sensitivity": 1.3589498417227364 + }, + { + "name": "model.layers.29.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0268778396493872e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.128239328972995e-05, + "sensitivity": 1.0226825999244105 + }, + { + "name": "model.layers.29.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.3500389286491554e-05, + "sensitivity": 1.2856436479466968 + }, + { + "name": "model.layers.29.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0672217740648193e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.817922596586868e-05, + "sensitivity": 0.735424878448092 + }, + { + "name": "model.layers.29.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8055913541466e-05, + "sensitivity": 0.6472351196485872 + }, + { + "name": "model.layers.29.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.810197300590517e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006911588134244084, + "sensitivity": 0.539744523902177 + }, + { + "name": "model.layers.29.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1501897461130284e-05, + "sensitivity": 1.6607179458976082 + }, + { + "name": "model.layers.29.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.891829222397064e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.287913856795058e-05, + "sensitivity": 0.7105980994435643 + }, + { + "name": "model.layers.29.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8686156990006566e-05, + "sensitivity": 0.6456902895304898 + }, + { + "name": "model.layers.29.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.825528882676736e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006794440560042858, + "sensitivity": 0.521410162012892 + }, + { + "name": "model.layers.29.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7550765632186085e-05, + "sensitivity": 0.9266006562597509 + }, + { + "name": "model.layers.29.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.680682756472379e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006679994985461235, + "sensitivity": 0.5045260072667561 + }, + { + "name": "model.layers.29.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.96625468460843e-05, + "sensitivity": 1.127357061817252 + }, + { + "name": "model.layers.29.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.079819278667856e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006761566619388759, + "sensitivity": 0.5431194106430701 + }, + { + "name": "model.layers.29.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.376586679834872e-05, + "sensitivity": 0.6759466703952788 + }, + { + "name": "model.layers.29.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.266098916465126e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.42963859718293e-05, + "sensitivity": 0.6660097341938759 + }, + { + "name": "model.layers.29.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0922470210061874e-05, + "sensitivity": 1.7621816466696123 + }, + { + "name": "model.layers.29.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.929210141810472e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00067975337151438, + "sensitivity": 0.5844808968714085 + }, + { + "name": "model.layers.29.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.343980930978432e-05, + "sensitivity": 1.083174489513817 + }, + { + "name": "model.layers.29.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1778834050346632e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007397168083116412, + "sensitivity": 0.5205947016472083 + }, + { + "name": "model.layers.29.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8955163694918156e-05, + "sensitivity": 0.9503366381029716 + }, + { + "name": "model.layers.29.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.689407877682243e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006602643406949937, + "sensitivity": 0.5558265280590873 + }, + { + "name": "model.layers.29.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.923423304921016e-05, + "sensitivity": 0.7318780769070845 + }, + { + "name": "model.layers.29.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.675053896287864e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006760814576409757, + "sensitivity": 0.5222850768586121 + }, + { + "name": "model.layers.29.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.198509072419256e-05, + "sensitivity": 1.0467227833139205 + }, + { + "name": "model.layers.29.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0941247410301003e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.359622057061642e-05, + "sensitivity": 0.6696242068648006 + }, + { + "name": "model.layers.29.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.422137473942712e-05, + "sensitivity": 0.9215037161725961 + }, + { + "name": "model.layers.29.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.293425940384623e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006459978758357465, + "sensitivity": 0.5589603451073145 + }, + { + "name": "model.layers.29.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.876378756714985e-05, + "sensitivity": 0.8206796680977609 + }, + { + "name": "model.layers.29.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.695794460640172e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007909519481472671, + "sensitivity": 0.5592413850257201 + }, + { + "name": "model.layers.29.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.260158988879994e-05, + "sensitivity": 0.8584946706150576 + }, + { + "name": "model.layers.29.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.556765808658383e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007190449978224933, + "sensitivity": 0.5270427544447248 + }, + { + "name": "model.layers.29.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.188862607814372e-05, + "sensitivity": 0.8598400868669094 + }, + { + "name": "model.layers.29.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.433704922732431e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007041522767394781, + "sensitivity": 0.5939115945707742 + }, + { + "name": "model.layers.29.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1699459719238803e-05, + "sensitivity": 1.351683140597715 + }, + { + "name": "model.layers.29.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0357935025240295e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.420719728339463e-05, + "sensitivity": 0.6220629446744618 + }, + { + "name": "model.layers.29.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0798736184369773e-05, + "sensitivity": 1.2822720815714983 + }, + { + "name": "model.layers.29.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.989412438291765e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.880851676920429e-05, + "sensitivity": 0.6410048427064311 + }, + { + "name": "model.layers.29.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.028365169186145e-05, + "sensitivity": 1.1083570109043792 + }, + { + "name": "model.layers.29.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.531968660463463e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006908149225637317, + "sensitivity": 0.5345563651933907 + }, + { + "name": "model.layers.29.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.265808431431651e-05, + "sensitivity": 1.0788281190084836 + }, + { + "name": "model.layers.29.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0629898952174699e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.459458043333143e-05, + "sensitivity": 0.7556311788148847 + }, + { + "name": "model.layers.29.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.83390865358524e-05, + "sensitivity": 1.0535404893695808 + }, + { + "name": "model.layers.29.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0908049716817914e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.879052332602441e-05, + "sensitivity": 0.7183428750320041 + }, + { + "name": "model.layers.29.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0993431715178303e-05, + "sensitivity": 1.2326023219237154 + }, + { + "name": "model.layers.29.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.711209258966846e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000676387338899076, + "sensitivity": 0.5116077436750265 + }, + { + "name": "model.layers.29.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.432647205656394e-05, + "sensitivity": 1.0017480219088917 + }, + { + "name": "model.layers.29.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.376708595074888e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007347021019086242, + "sensitivity": 0.5224913083325531 + }, + { + "name": "model.layers.29.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1400333278288599e-05, + "sensitivity": 1.5576240295820754 + }, + { + "name": "model.layers.29.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.995477406235295e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006943045882508159, + "sensitivity": 0.5048246666250034 + }, + { + "name": "model.layers.29.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.011391476728022e-05, + "sensitivity": 1.183016337614897 + }, + { + "name": "model.layers.29.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.692517106581363e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006028522620908916, + "sensitivity": 0.5095738504080318 + }, + { + "name": "model.layers.29.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8794597862288356e-05, + "sensitivity": 0.9245617575536266 + }, + { + "name": "model.layers.29.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1629790606093593e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006719491793774068, + "sensitivity": 0.5295724505497401 + }, + { + "name": "model.layers.29.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 3.8845482777105644e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.589534688013373e-06, + "sensitivity": 2.102444515648742 + }, + { + "name": "model.layers.29.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0225389814877417e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.29.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 8.044953574426472e-06, + "sensitivity": 1.9103508405580032 + }, + { + "name": "model.layers.29.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 9.417742148798425e-06, + "sensitivity": 2.055706685766689 + }, + { + "name": "model.layers.29.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.000219018169445917, + "sensitivity": 0.8624596053524523 + }, + { + "name": "model.layers.29.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.5322419130825438e-05, + "sensitivity": 1.052707068247565 + }, + { + "name": "model.layers.29.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.8257497585145757e-05, + "sensitivity": 0.6497595872171725 + }, + { + "name": "model.layers.29.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003324975841678679, + "sensitivity": 0.7475651932465758 + }, + { + "name": "model.layers.30.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.015154576743953e-05, + "sensitivity": 0.7426248567302006 + }, + { + "name": "model.layers.30.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.708102197691915e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006990457768552005, + "sensitivity": 0.570338974266182 + }, + { + "name": "model.layers.30.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0257415851810947e-05, + "sensitivity": 1.341510098576097 + }, + { + "name": "model.layers.30.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4229308362700976e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006257821805775166, + "sensitivity": 0.557440358996066 + }, + { + "name": "model.layers.30.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.416493316559354e-06, + "sensitivity": 2.068032270043641 + }, + { + "name": "model.layers.30.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.421631380566396e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006835166714154184, + "sensitivity": 0.5369512121082289 + }, + { + "name": "model.layers.30.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.968460027361289e-05, + "sensitivity": 0.6299516066963418 + }, + { + "name": "model.layers.30.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.458995128217794e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006997189484536648, + "sensitivity": 0.5421818028623373 + }, + { + "name": "model.layers.30.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006527408841066062, + "sensitivity": 0.5457427932893928 + }, + { + "name": "model.layers.30.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.343693712551612e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000652086571790278, + "sensitivity": 0.5183539764359181 + }, + { + "name": "model.layers.30.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006958710728213191, + "sensitivity": 0.5268857457250861 + }, + { + "name": "model.layers.30.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.23251218914811e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007068949053063989, + "sensitivity": 0.5297693285126956 + }, + { + "name": "model.layers.30.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.775525642093271e-05, + "sensitivity": 0.6459913728286961 + }, + { + "name": "model.layers.30.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.636366490260116e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006463612662628293, + "sensitivity": 0.5280918235111568 + }, + { + "name": "model.layers.30.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.2382281864993274e-05, + "sensitivity": 0.730148379891373 + }, + { + "name": "model.layers.30.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.969402536720736e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006135470466688275, + "sensitivity": 0.5375751724808642 + }, + { + "name": "model.layers.30.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.635462341364473e-05, + "sensitivity": 0.6607404951264891 + }, + { + "name": "model.layers.30.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.353126984024129e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007420014590024948, + "sensitivity": 0.5805494042852634 + }, + { + "name": "model.layers.30.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.411562945781043e-06, + "sensitivity": 2.097195952399568 + }, + { + "name": "model.layers.30.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1588028883124935e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.18297272012569e-05, + "sensitivity": 0.7682464693916097 + }, + { + "name": "model.layers.30.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0808637499576434e-05, + "sensitivity": 0.7145488850709897 + }, + { + "name": "model.layers.30.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.111655122571392e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006838343106210232, + "sensitivity": 0.5822331405121125 + }, + { + "name": "model.layers.30.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006563186179846525, + "sensitivity": 0.5312036906048698 + }, + { + "name": "model.layers.30.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.58748569751333e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006964618805795908, + "sensitivity": 0.5298753878260306 + }, + { + "name": "model.layers.30.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006754223140887916, + "sensitivity": 0.5156401130429054 + }, + { + "name": "model.layers.30.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.447945336025441e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006823883741162717, + "sensitivity": 0.5107908400844566 + }, + { + "name": "model.layers.30.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006073982222005725, + "sensitivity": 0.5254207564720779 + }, + { + "name": "model.layers.30.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.274547104112571e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006089885719120502, + "sensitivity": 0.5631131213536003 + }, + { + "name": "model.layers.30.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006655773613601923, + "sensitivity": 0.555978133400762 + }, + { + "name": "model.layers.30.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.66364451010304e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006464900798164308, + "sensitivity": 0.5394717314773105 + }, + { + "name": "model.layers.30.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.25215470790863e-05, + "sensitivity": 0.8981661383305738 + }, + { + "name": "model.layers.30.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.160312401945703e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007082045776769519, + "sensitivity": 0.5297602055596318 + }, + { + "name": "model.layers.30.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.308461161097512e-05, + "sensitivity": 0.8069084378586999 + }, + { + "name": "model.layers.30.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.778459464840125e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007002949714660645, + "sensitivity": 0.5352083518415255 + }, + { + "name": "model.layers.30.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.609127038042061e-05, + "sensitivity": 0.986270045721959 + }, + { + "name": "model.layers.30.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2706118468486238e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006351824849843979, + "sensitivity": 0.5286329893672858 + }, + { + "name": "model.layers.30.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.066116475267336e-05, + "sensitivity": 0.6218357283518234 + }, + { + "name": "model.layers.30.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.527363325403712e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006956635043025017, + "sensitivity": 0.5063376454329676 + }, + { + "name": "model.layers.30.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006834025261923671, + "sensitivity": 0.532428491987421 + }, + { + "name": "model.layers.30.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.93891479386366e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006704911356791854, + "sensitivity": 0.5246352978118395 + }, + { + "name": "model.layers.30.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.699572259094566e-05, + "sensitivity": 0.7592780785958149 + }, + { + "name": "model.layers.30.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.041525004249706e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008001071400940418, + "sensitivity": 0.5201011674764794 + }, + { + "name": "model.layers.30.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.042468885425478e-05, + "sensitivity": 0.6490340403344277 + }, + { + "name": "model.layers.30.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1952124623348936e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006754541536793113, + "sensitivity": 0.5893423985990394 + }, + { + "name": "model.layers.30.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007010068511590362, + "sensitivity": 0.5273114252977092 + }, + { + "name": "model.layers.30.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.999040351729491e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007172173354774714, + "sensitivity": 0.5270306134711955 + }, + { + "name": "model.layers.30.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.67907006572932e-05, + "sensitivity": 0.6118122355639802 + }, + { + "name": "model.layers.30.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.126656894091866e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007512892480008304, + "sensitivity": 0.5399264717840342 + }, + { + "name": "model.layers.30.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.008451964589767e-05, + "sensitivity": 0.8854572099077197 + }, + { + "name": "model.layers.30.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.219863272846851e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000699728901963681, + "sensitivity": 0.5180591156333413 + }, + { + "name": "model.layers.30.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006918796570971608, + "sensitivity": 0.5580297169804179 + }, + { + "name": "model.layers.30.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.048790505199577e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006738638039678335, + "sensitivity": 0.5185833491562031 + }, + { + "name": "model.layers.30.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.27662957413122e-05, + "sensitivity": 1.0814659311030466 + }, + { + "name": "model.layers.30.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.413457746632048e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007094471948221326, + "sensitivity": 0.5640582882641668 + }, + { + "name": "model.layers.30.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0162171747651882e-05, + "sensitivity": 1.218976329322489 + }, + { + "name": "model.layers.30.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.677605822209443e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.799374412163161e-05, + "sensitivity": 0.619416337755879 + }, + { + "name": "model.layers.30.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8360510593047366e-05, + "sensitivity": 1.1677657418330314 + }, + { + "name": "model.layers.30.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.812866786276572e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006855240790173411, + "sensitivity": 0.5160652001522761 + }, + { + "name": "model.layers.30.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.099830352468416e-05, + "sensitivity": 0.9548676359623324 + }, + { + "name": "model.layers.30.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.200710696342867e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.188444967847317e-05, + "sensitivity": 0.6023869635624379 + }, + { + "name": "model.layers.30.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.634227636619471e-05, + "sensitivity": 0.733555979292331 + }, + { + "name": "model.layers.30.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.315488801395986e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6012584536802024e-05, + "sensitivity": 0.6359785545623443 + }, + { + "name": "model.layers.30.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.044408418238163e-05, + "sensitivity": 1.2033294355967934 + }, + { + "name": "model.layers.30.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.308987963166146e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006480125593952835, + "sensitivity": 0.5548057581737598 + }, + { + "name": "model.layers.30.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.284918345045298e-05, + "sensitivity": 0.6717903528204221 + }, + { + "name": "model.layers.30.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.661486390337814e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000710463966242969, + "sensitivity": 0.5555197050832431 + }, + { + "name": "model.layers.30.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.311116077180486e-06, + "sensitivity": 2.0969564656731934 + }, + { + "name": "model.layers.30.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0233148941551917e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.632851389236748e-05, + "sensitivity": 0.630907247094808 + }, + { + "name": "model.layers.30.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.033224053680897e-05, + "sensitivity": 0.6442301639298704 + }, + { + "name": "model.layers.30.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.342804337895359e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006754806963726878, + "sensitivity": 0.5561440616800098 + }, + { + "name": "model.layers.30.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007118529174476862, + "sensitivity": 0.5422963772813969 + }, + { + "name": "model.layers.30.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.256641876869253e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007107066339813173, + "sensitivity": 0.5588908812659912 + }, + { + "name": "model.layers.30.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.225402466952801e-05, + "sensitivity": 0.7906861539903387 + }, + { + "name": "model.layers.30.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.479971711494727e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.446888437494636e-05, + "sensitivity": 0.6032756506953696 + }, + { + "name": "model.layers.30.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0619626310653985e-05, + "sensitivity": 0.6361755813530433 + }, + { + "name": "model.layers.30.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.904165724743507e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000665870844386518, + "sensitivity": 0.553426458133951 + }, + { + "name": "model.layers.30.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0791539352794643e-05, + "sensitivity": 1.6829568291601338 + }, + { + "name": "model.layers.30.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.070061312537291e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006561347981914878, + "sensitivity": 0.5469639422869249 + }, + { + "name": "model.layers.30.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1938354873564094e-05, + "sensitivity": 1.3713120082585726 + }, + { + "name": "model.layers.30.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.141029752550821e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007126179407350719, + "sensitivity": 0.541734676034441 + }, + { + "name": "model.layers.30.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006823695148341358, + "sensitivity": 0.5242518275347718 + }, + { + "name": "model.layers.30.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.346495405930909e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006622931687161326, + "sensitivity": 0.5347347814650977 + }, + { + "name": "model.layers.30.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0005722594214603305, + "sensitivity": 0.5160303290752728 + }, + { + "name": "model.layers.30.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.777962428510364e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006014804821461439, + "sensitivity": 0.5754627319974269 + }, + { + "name": "model.layers.30.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.832753231516108e-05, + "sensitivity": 0.6650601408621338 + }, + { + "name": "model.layers.30.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.423597819273709e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006914226105436683, + "sensitivity": 0.5302615652543387 + }, + { + "name": "model.layers.30.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006521005998365581, + "sensitivity": 0.5416308612017834 + }, + { + "name": "model.layers.30.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.785887194382667e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006727149593643844, + "sensitivity": 0.5354997677898555 + }, + { + "name": "model.layers.30.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.51544944755733e-05, + "sensitivity": 0.636079790850619 + }, + { + "name": "model.layers.30.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.472079689956445e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006613274454139173, + "sensitivity": 0.507410377369462 + }, + { + "name": "model.layers.30.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006492552347481251, + "sensitivity": 0.5308803764242738 + }, + { + "name": "model.layers.30.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.755552703907597e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006690435111522675, + "sensitivity": 0.5411096740341178 + }, + { + "name": "model.layers.30.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.460402356518898e-06, + "sensitivity": 2.0200801708431744 + }, + { + "name": "model.layers.30.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.79949959400983e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000674651877488941, + "sensitivity": 0.5680931246618184 + }, + { + "name": "model.layers.30.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.299297092482448e-05, + "sensitivity": 0.8867253477220367 + }, + { + "name": "model.layers.30.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.157261734391795e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007330344524234533, + "sensitivity": 0.560721048773979 + }, + { + "name": "model.layers.30.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.222270894795656e-05, + "sensitivity": 0.7954661401723553 + }, + { + "name": "model.layers.30.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.009703265088319e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006806800956837833, + "sensitivity": 0.5455696565941418 + }, + { + "name": "model.layers.30.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.974786472506821e-05, + "sensitivity": 0.6723743552272199 + }, + { + "name": "model.layers.30.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.445172514053411e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007063198718242347, + "sensitivity": 0.5576978653888438 + }, + { + "name": "model.layers.30.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5851429351605475e-05, + "sensitivity": 0.7364756085932235 + }, + { + "name": "model.layers.30.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.620248538842134e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.893485649721697e-05, + "sensitivity": 0.8522049513356869 + }, + { + "name": "model.layers.30.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.370234041241929e-05, + "sensitivity": 0.6197783540478244 + }, + { + "name": "model.layers.30.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.212435662040662e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007217250531539321, + "sensitivity": 0.5321019213411731 + }, + { + "name": "model.layers.30.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000654602306894958, + "sensitivity": 0.530465275731082 + }, + { + "name": "model.layers.30.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.233106427724124e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006613265722990036, + "sensitivity": 0.5222997290923046 + }, + { + "name": "model.layers.30.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0877035139128566e-05, + "sensitivity": 0.7457574150362853 + }, + { + "name": "model.layers.30.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.526483270543395e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006738962838426232, + "sensitivity": 0.534732496544086 + }, + { + "name": "model.layers.30.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006636708858422935, + "sensitivity": 0.5195797426537276 + }, + { + "name": "model.layers.30.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.641471029273816e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006632024305872619, + "sensitivity": 0.5196129123776887 + }, + { + "name": "model.layers.30.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9599551605060697e-05, + "sensitivity": 1.0057646697736238 + }, + { + "name": "model.layers.30.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.830584986048052e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006895669503137469, + "sensitivity": 0.5602400107011698 + }, + { + "name": "model.layers.30.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.854888488305733e-05, + "sensitivity": 0.8415411470399301 + }, + { + "name": "model.layers.30.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.822599622566486e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008085812442004681, + "sensitivity": 0.5280799334258095 + }, + { + "name": "model.layers.30.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006746994331479073, + "sensitivity": 0.5898004915216961 + }, + { + "name": "model.layers.30.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.446526524290675e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006855802494101226, + "sensitivity": 0.5336895431191634 + }, + { + "name": "model.layers.30.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2129424248996656e-05, + "sensitivity": 1.6884000705170799 + }, + { + "name": "model.layers.30.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0735639079939574e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007837393786758184, + "sensitivity": 0.5348358995309848 + }, + { + "name": "model.layers.30.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006310338503681123, + "sensitivity": 0.5762165648324461 + }, + { + "name": "model.layers.30.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.931494110380299e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006336253136396408, + "sensitivity": 0.5339243528805794 + }, + { + "name": "model.layers.30.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.347291491692886e-05, + "sensitivity": 0.7781287257797715 + }, + { + "name": "model.layers.30.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0433032002765685e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000784137926530093, + "sensitivity": 0.562086903939062 + }, + { + "name": "model.layers.30.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006617470644414425, + "sensitivity": 0.575948489812812 + }, + { + "name": "model.layers.30.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.942205115796241e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006689120782539248, + "sensitivity": 0.5317671789060421 + }, + { + "name": "model.layers.30.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.072557152947411e-05, + "sensitivity": 0.7557548082297848 + }, + { + "name": "model.layers.30.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.698338665955816e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007093813037499785, + "sensitivity": 0.5447646745469671 + }, + { + "name": "model.layers.30.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1320262274239212e-05, + "sensitivity": 1.4163730000425874 + }, + { + "name": "model.layers.30.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0273743100697175e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0776026657549664e-05, + "sensitivity": 0.8746320371225154 + }, + { + "name": "model.layers.30.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 3.4489867175580002e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.299735342603526e-06, + "sensitivity": 2.1024977629783432 + }, + { + "name": "model.layers.30.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2669231637119083e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.30.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.929786321852589e-06, + "sensitivity": 2.106870270311985 + }, + { + "name": "model.layers.30.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 3.6172932595945895e-05, + "sensitivity": 1.9474194293608793 + }, + { + "name": "model.layers.30.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00020695090643130243, + "sensitivity": 0.9157667066935129 + }, + { + "name": "model.layers.30.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.4540173651766963e-05, + "sensitivity": 1.0612963919674225 + }, + { + "name": "model.layers.30.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.5201999202836305e-05, + "sensitivity": 0.6605952275194953 + }, + { + "name": "model.layers.30.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003148860123474151, + "sensitivity": 0.7093501681741063 + }, + { + "name": "model.layers.31.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8468263887334615e-05, + "sensitivity": 0.7704368753166795 + }, + { + "name": "model.layers.31.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.081580856218352e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006674011237919331, + "sensitivity": 0.5529444141700486 + }, + { + "name": "model.layers.31.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.511792889796197e-05, + "sensitivity": 0.6415341005553679 + }, + { + "name": "model.layers.31.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.7204504123074e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007301999139599502, + "sensitivity": 0.5286666147702828 + }, + { + "name": "model.layers.31.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.619533476419747e-05, + "sensitivity": 0.8940571967045164 + }, + { + "name": "model.layers.31.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.339020496350713e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006201354553923011, + "sensitivity": 0.5290649406384328 + }, + { + "name": "model.layers.31.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.349934119498357e-05, + "sensitivity": 0.6277061001064559 + }, + { + "name": "model.layers.31.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.017706593615003e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007138755172491074, + "sensitivity": 0.5469204769421583 + }, + { + "name": "model.layers.31.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.684990173904225e-05, + "sensitivity": 1.1979168465733443 + }, + { + "name": "model.layers.31.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1360696134943282e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.610445441561751e-05, + "sensitivity": 1.0133012421606187 + }, + { + "name": "model.layers.31.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.827905599493533e-05, + "sensitivity": 0.6365132678327916 + }, + { + "name": "model.layers.31.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.839330914473976e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007780664600431919, + "sensitivity": 0.5254554889456059 + }, + { + "name": "model.layers.31.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.177544128149748e-05, + "sensitivity": 0.652042736836698 + }, + { + "name": "model.layers.31.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.562518587496015e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006849101046100259, + "sensitivity": 0.5229993940747226 + }, + { + "name": "model.layers.31.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8996094594476745e-05, + "sensitivity": 0.9001274458719446 + }, + { + "name": "model.layers.31.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.080515729285253e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006580407498404384, + "sensitivity": 0.5584736089117935 + }, + { + "name": "model.layers.31.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.3075146853225306e-05, + "sensitivity": 1.3283786793144876 + }, + { + "name": "model.layers.31.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.401481313223485e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.425007061101496e-05, + "sensitivity": 0.8093269055792073 + }, + { + "name": "model.layers.31.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1304039617243689e-05, + "sensitivity": 1.6346502932725566 + }, + { + "name": "model.layers.31.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8674481907510199e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006828908808529377, + "sensitivity": 0.5795146250480949 + }, + { + "name": "model.layers.31.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.022580782882869e-05, + "sensitivity": 0.7738845698542013 + }, + { + "name": "model.layers.31.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.406168040484772e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006686788401566446, + "sensitivity": 0.5631080963940606 + }, + { + "name": "model.layers.31.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.375870725605637e-05, + "sensitivity": 0.9030434653779285 + }, + { + "name": "model.layers.31.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.460939741577022e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.35336764389649e-05, + "sensitivity": 0.6671240378049691 + }, + { + "name": "model.layers.31.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8716843341244385e-05, + "sensitivity": 0.8648350763376629 + }, + { + "name": "model.layers.31.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.855777314740408e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006524638156406581, + "sensitivity": 0.5290384567532244 + }, + { + "name": "model.layers.31.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.607050843536854e-05, + "sensitivity": 0.894590257243086 + }, + { + "name": "model.layers.31.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.24347694106109e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006378382677212358, + "sensitivity": 0.5207844009303269 + }, + { + "name": "model.layers.31.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7830642617773265e-05, + "sensitivity": 0.6231027577611008 + }, + { + "name": "model.layers.31.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.521796305809403e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006521535106003284, + "sensitivity": 0.539107912431757 + }, + { + "name": "model.layers.31.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.558683526236564e-05, + "sensitivity": 0.6299234225508884 + }, + { + "name": "model.layers.31.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0819728686328745e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007361457101069391, + "sensitivity": 0.5116815001425605 + }, + { + "name": "model.layers.31.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.356211088132113e-05, + "sensitivity": 0.7695195594767232 + }, + { + "name": "model.layers.31.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.574600431325962e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007274709641933441, + "sensitivity": 0.5268401927394826 + }, + { + "name": "model.layers.31.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.971819336991757e-05, + "sensitivity": 0.6334547217803769 + }, + { + "name": "model.layers.31.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.814804578425537e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006592515856027603, + "sensitivity": 0.5430403162978247 + }, + { + "name": "model.layers.31.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.718471948057413e-05, + "sensitivity": 0.8860518885336821 + }, + { + "name": "model.layers.31.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.698481567786075e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006593194557353854, + "sensitivity": 0.5629133412569021 + }, + { + "name": "model.layers.31.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.433457019738853e-05, + "sensitivity": 1.1254282613929973 + }, + { + "name": "model.layers.31.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1986179515588447e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007379350136034191, + "sensitivity": 0.5787052113683426 + }, + { + "name": "model.layers.31.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.243315147003159e-05, + "sensitivity": 1.1387711831125709 + }, + { + "name": "model.layers.31.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.299813091776741e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007094683824107051, + "sensitivity": 0.5533504954977201 + }, + { + "name": "model.layers.31.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.487010978162289e-05, + "sensitivity": 0.8870397562972074 + }, + { + "name": "model.layers.31.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.845452950685285e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007366963545791805, + "sensitivity": 0.5820904974332545 + }, + { + "name": "model.layers.31.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7183449825970456e-05, + "sensitivity": 0.656502066192816 + }, + { + "name": "model.layers.31.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.973290164249192e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006509209633804858, + "sensitivity": 0.5411742853127636 + }, + { + "name": "model.layers.31.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1323614671709947e-05, + "sensitivity": 1.3312245108474534 + }, + { + "name": "model.layers.31.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.52450057209353e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.21297222096473e-05, + "sensitivity": 0.709557071624678 + }, + { + "name": "model.layers.31.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1298370736767538e-05, + "sensitivity": 1.4353513722909486 + }, + { + "name": "model.layers.31.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.637795758659195e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.1371079381206073e-05, + "sensitivity": 1.2417765141231936 + }, + { + "name": "model.layers.31.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0344551457092166e-05, + "sensitivity": 0.651280011400859 + }, + { + "name": "model.layers.31.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.368881031448836e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006832012441009283, + "sensitivity": 0.5449003469395284 + }, + { + "name": "model.layers.31.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.100889731897041e-05, + "sensitivity": 0.6805697676640046 + }, + { + "name": "model.layers.31.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.011695851768309e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006746221333742142, + "sensitivity": 0.5539541937754147 + }, + { + "name": "model.layers.31.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.130707333795726e-05, + "sensitivity": 0.898342347826991 + }, + { + "name": "model.layers.31.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.560184028283402e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.240061338758096e-05, + "sensitivity": 0.699196286363331 + }, + { + "name": "model.layers.31.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.455281254602596e-05, + "sensitivity": 0.6060145630080613 + }, + { + "name": "model.layers.31.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.114626328075246e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007253969088196754, + "sensitivity": 0.5264872277296274 + }, + { + "name": "model.layers.31.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.352518539642915e-05, + "sensitivity": 0.9021443910946008 + }, + { + "name": "model.layers.31.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.693615202697401e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007116659544408321, + "sensitivity": 0.5444819090803857 + }, + { + "name": "model.layers.31.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.693281855201349e-05, + "sensitivity": 0.8406657801146122 + }, + { + "name": "model.layers.31.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.154355800281337e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000648379442282021, + "sensitivity": 0.5485529437568162 + }, + { + "name": "model.layers.31.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.49531721137464e-05, + "sensitivity": 0.8533022512698942 + }, + { + "name": "model.layers.31.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0707019555411534e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007387680816464126, + "sensitivity": 0.5947496587679157 + }, + { + "name": "model.layers.31.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0446146916365251e-05, + "sensitivity": 1.8687426565065384 + }, + { + "name": "model.layers.31.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.578119263802364e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.948282341705635e-05, + "sensitivity": 0.8644843626500631 + }, + { + "name": "model.layers.31.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006728979060426354, + "sensitivity": 0.5286270315974673 + }, + { + "name": "model.layers.31.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.810951163060963e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006890149670653045, + "sensitivity": 0.5334115081374763 + }, + { + "name": "model.layers.31.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0842823940038215e-05, + "sensitivity": 1.2807508756914276 + }, + { + "name": "model.layers.31.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6346336906281067e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006495722918771207, + "sensitivity": 0.5898554595158239 + }, + { + "name": "model.layers.31.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.640401261392981e-05, + "sensitivity": 0.9279391272750697 + }, + { + "name": "model.layers.31.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.424829047726234e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.593161378987134e-05, + "sensitivity": 0.781532215612114 + }, + { + "name": "model.layers.31.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4921521344367648e-06, + "sensitivity": 2.0377173950635514 + }, + { + "name": "model.layers.31.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.517529413940792e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007034411537460983, + "sensitivity": 0.5831895966959659 + }, + { + "name": "model.layers.31.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007116184569895267, + "sensitivity": 0.5167591744493841 + }, + { + "name": "model.layers.31.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.56876908983395e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007220436818897724, + "sensitivity": 0.538829350031002 + }, + { + "name": "model.layers.31.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.998825508868322e-05, + "sensitivity": 1.0081319464927576 + }, + { + "name": "model.layers.31.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0649193882272812e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.948321631876752e-05, + "sensitivity": 0.7711673381502773 + }, + { + "name": "model.layers.31.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.886694270884618e-05, + "sensitivity": 0.8075581139603659 + }, + { + "name": "model.layers.31.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.013052155940386e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.973217048449442e-05, + "sensitivity": 0.673664175340692 + }, + { + "name": "model.layers.31.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.21599901933223e-05, + "sensitivity": 0.6508413306085191 + }, + { + "name": "model.layers.31.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.250984819824225e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.1500642914325e-05, + "sensitivity": 0.6049076723641859 + }, + { + "name": "model.layers.31.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006808378966525197, + "sensitivity": 0.5208643844970862 + }, + { + "name": "model.layers.31.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.783395747333998e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006754760397598147, + "sensitivity": 0.538272997584305 + }, + { + "name": "model.layers.31.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007046404061838984, + "sensitivity": 0.568389341079643 + }, + { + "name": "model.layers.31.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.029593120932986e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007014821167103946, + "sensitivity": 0.5339323282858275 + }, + { + "name": "model.layers.31.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006812801002524793, + "sensitivity": 0.5453009281263134 + }, + { + "name": "model.layers.31.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.037923523967038e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007010138942860067, + "sensitivity": 0.5404320787283657 + }, + { + "name": "model.layers.31.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.81870078551583e-05, + "sensitivity": 0.7702119661717827 + }, + { + "name": "model.layers.31.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.47266846903949e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008017338695935905, + "sensitivity": 0.5350504548180041 + }, + { + "name": "model.layers.31.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.913656059419736e-05, + "sensitivity": 0.7901492028913242 + }, + { + "name": "model.layers.31.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.042073543241713e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006699702935293317, + "sensitivity": 0.5503786042450737 + }, + { + "name": "model.layers.31.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.406678585335612e-05, + "sensitivity": 0.7009094963382627 + }, + { + "name": "model.layers.31.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.659405577622238e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007090986473485827, + "sensitivity": 0.5265877850917609 + }, + { + "name": "model.layers.31.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.886701910640113e-05, + "sensitivity": 0.7843673569548426 + }, + { + "name": "model.layers.31.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.284968776526512e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000662897014990449, + "sensitivity": 0.526075505707002 + }, + { + "name": "model.layers.31.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006759184179827571, + "sensitivity": 0.5187657813125973 + }, + { + "name": "model.layers.31.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.443279971790616e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006654299795627594, + "sensitivity": 0.5557285372885824 + }, + { + "name": "model.layers.31.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007128709694370627, + "sensitivity": 0.5862122609632472 + }, + { + "name": "model.layers.31.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.851219265830878e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007100088405422866, + "sensitivity": 0.5321009028753962 + }, + { + "name": "model.layers.31.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.917869202676229e-05, + "sensitivity": 0.7439762383398979 + }, + { + "name": "model.layers.31.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0575116675681784e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8772682677954435e-05, + "sensitivity": 0.6697990741169153 + }, + { + "name": "model.layers.31.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.267271237447858e-05, + "sensitivity": 0.6693018300641805 + }, + { + "name": "model.layers.31.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0351918717788067e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007131524616852403, + "sensitivity": 0.5553862804516791 + }, + { + "name": "model.layers.31.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.571525980485603e-05, + "sensitivity": 0.7593574912346379 + }, + { + "name": "model.layers.31.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.50231811505364e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006214475142769516, + "sensitivity": 0.5186585832806565 + }, + { + "name": "model.layers.31.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007052220171317458, + "sensitivity": 0.5543268492316018 + }, + { + "name": "model.layers.31.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.105981580934895e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007125932606868446, + "sensitivity": 0.5515786949927082 + }, + { + "name": "model.layers.31.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006962413317523897, + "sensitivity": 0.5385200483808844 + }, + { + "name": "model.layers.31.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.852926273699268e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006926399655640125, + "sensitivity": 0.5405527167675919 + }, + { + "name": "model.layers.31.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.170654523884878e-05, + "sensitivity": 1.1100872987952222 + }, + { + "name": "model.layers.31.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.091602469699865e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006956871366128325, + "sensitivity": 0.5360212011740967 + }, + { + "name": "model.layers.31.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.15095705143176e-05, + "sensitivity": 0.6811563517245001 + }, + { + "name": "model.layers.31.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.374716801678005e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007062244112603366, + "sensitivity": 0.5287654391470051 + }, + { + "name": "model.layers.31.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3609932213730644e-06, + "sensitivity": 2.023153175088108 + }, + { + "name": "model.layers.31.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.27149473883037e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006437036208808422, + "sensitivity": 0.5416564376507254 + }, + { + "name": "model.layers.31.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.237586785573512e-05, + "sensitivity": 0.7100317415014715 + }, + { + "name": "model.layers.31.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2045081803080393e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007157950894907117, + "sensitivity": 0.5899702485633888 + }, + { + "name": "model.layers.31.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006820306880399585, + "sensitivity": 0.5833699612789833 + }, + { + "name": "model.layers.31.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.224387784139253e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006842842558398843, + "sensitivity": 0.5018189453865229 + }, + { + "name": "model.layers.31.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007270959904417396, + "sensitivity": 0.5259081677053208 + }, + { + "name": "model.layers.31.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.301316031771421e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007231729105114937, + "sensitivity": 0.5514941835225439 + }, + { + "name": "model.layers.31.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1107618774985895e-05, + "sensitivity": 1.4002047695620259 + }, + { + "name": "model.layers.31.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.255491497431649e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006731553003191948, + "sensitivity": 0.5585212465689661 + }, + { + "name": "model.layers.31.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1154217645525932e-05, + "sensitivity": 1.4385724265204927 + }, + { + "name": "model.layers.31.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.069547223181871e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006714066839776933, + "sensitivity": 0.5192027185299167 + }, + { + "name": "model.layers.31.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007347787613980472, + "sensitivity": 0.5125204700049452 + }, + { + "name": "model.layers.31.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.318411346408539e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007288306951522827, + "sensitivity": 0.587615550700303 + }, + { + "name": "model.layers.31.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 3.210554496035911e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.2065328266762663e-06, + "sensitivity": 2.1003828096964607 + }, + { + "name": "model.layers.31.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0882532706091297e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.31.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.7383321164743393e-06, + "sensitivity": 2.1022655755006223 + }, + { + "name": "model.layers.31.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 3.1080002372618765e-05, + "sensitivity": 1.843732268177789 + }, + { + "name": "model.layers.31.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00022236672521103173, + "sensitivity": 1.0170271287880843 + }, + { + "name": "model.layers.31.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.5215414350677747e-05, + "sensitivity": 1.6214888361845718 + }, + { + "name": "model.layers.31.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 4.782108590006828e-05, + "sensitivity": 0.7004973790226638 + }, + { + "name": "model.layers.31.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00032895314507186413, + "sensitivity": 0.9240737662961647 + }, + { + "name": "model.layers.32.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.606420381809585e-05, + "sensitivity": 0.9649362148635467 + }, + { + "name": "model.layers.32.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.942946578827105e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006692299502901733, + "sensitivity": 0.5460937836512545 + }, + { + "name": "model.layers.32.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.264478724915534e-05, + "sensitivity": 0.6099876155725494 + }, + { + "name": "model.layers.32.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.525389603164513e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007197638042271137, + "sensitivity": 0.5200105510464363 + }, + { + "name": "model.layers.32.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.177735485835001e-05, + "sensitivity": 0.6629840281453379 + }, + { + "name": "model.layers.32.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.793670420142007e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006975379656068981, + "sensitivity": 0.5561546745096749 + }, + { + "name": "model.layers.32.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0763587852125056e-05, + "sensitivity": 1.2589342310986502 + }, + { + "name": "model.layers.32.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0428508403492742e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006716895732097328, + "sensitivity": 0.5662512122030134 + }, + { + "name": "model.layers.32.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7890323660103604e-05, + "sensitivity": 0.6347098733428269 + }, + { + "name": "model.layers.32.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.321653245322523e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006427511107176542, + "sensitivity": 0.5346122988248505 + }, + { + "name": "model.layers.32.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0927504263236187e-05, + "sensitivity": 1.501595800691353 + }, + { + "name": "model.layers.32.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.199421810990316e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006697450298815966, + "sensitivity": 0.5411569095923207 + }, + { + "name": "model.layers.32.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8642639487516135e-05, + "sensitivity": 1.1739049069702896 + }, + { + "name": "model.layers.32.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0378830666013528e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.792958472738974e-05, + "sensitivity": 0.6776969188811238 + }, + { + "name": "model.layers.32.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.162956560729071e-05, + "sensitivity": 0.6174896995213673 + }, + { + "name": "model.layers.32.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.686778644711012e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000701658776961267, + "sensitivity": 0.5410541531080846 + }, + { + "name": "model.layers.32.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0450092860264704e-05, + "sensitivity": 1.1273146457985566 + }, + { + "name": "model.layers.32.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.025373290365678e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006752379122190177, + "sensitivity": 0.5294148411093001 + }, + { + "name": "model.layers.32.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0923674381047022e-05, + "sensitivity": 1.2377859391467771 + }, + { + "name": "model.layers.32.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1817268159575178e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.853161565028131e-05, + "sensitivity": 0.6383737555960157 + }, + { + "name": "model.layers.32.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.48640125291422e-05, + "sensitivity": 0.8251090696989805 + }, + { + "name": "model.layers.32.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.488242085353704e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007383585325442255, + "sensitivity": 0.5300407158467315 + }, + { + "name": "model.layers.32.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.207423575688154e-05, + "sensitivity": 0.7946880630124619 + }, + { + "name": "model.layers.32.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.779234240639198e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.178009061841294e-05, + "sensitivity": 0.607340278864307 + }, + { + "name": "model.layers.32.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.113674317020923e-05, + "sensitivity": 0.6132008277580436 + }, + { + "name": "model.layers.32.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.503631872576079e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006904994370415807, + "sensitivity": 0.4919487280778674 + }, + { + "name": "model.layers.32.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.943081825738773e-05, + "sensitivity": 0.7095702993013553 + }, + { + "name": "model.layers.32.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.344419388260576e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007908889092504978, + "sensitivity": 0.528887365592974 + }, + { + "name": "model.layers.32.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.227463018149137e-05, + "sensitivity": 0.633281353503186 + }, + { + "name": "model.layers.32.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4148527043289505e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.405655585695058e-05, + "sensitivity": 0.7681167398438503 + }, + { + "name": "model.layers.32.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1613003152888268e-05, + "sensitivity": 1.4652860008941089 + }, + { + "name": "model.layers.32.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5658297343179584e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.480098818428814e-05, + "sensitivity": 0.6678229223136656 + }, + { + "name": "model.layers.32.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.223351682710927e-05, + "sensitivity": 1.2602449860418625 + }, + { + "name": "model.layers.32.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2119387520215241e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.807866884628311e-05, + "sensitivity": 0.9876875747720937 + }, + { + "name": "model.layers.32.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.837734690634534e-05, + "sensitivity": 0.7889816088325164 + }, + { + "name": "model.layers.32.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.310826953878859e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007940231589600444, + "sensitivity": 0.5613844542270392 + }, + { + "name": "model.layers.32.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.75334343011491e-05, + "sensitivity": 0.8937335580408019 + }, + { + "name": "model.layers.32.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.304001883312594e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006605214439332485, + "sensitivity": 0.5664894246302907 + }, + { + "name": "model.layers.32.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.292965215630829e-05, + "sensitivity": 0.6327678393903684 + }, + { + "name": "model.layers.32.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.056773938529659e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005934405489824712, + "sensitivity": 0.5736928104195572 + }, + { + "name": "model.layers.32.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.077988235920202e-05, + "sensitivity": 1.607922855116103 + }, + { + "name": "model.layers.32.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.693185691299732e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006635033059865236, + "sensitivity": 0.5264583360594192 + }, + { + "name": "model.layers.32.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.262138776946813e-05, + "sensitivity": 1.0255864866149005 + }, + { + "name": "model.layers.32.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1951515261898749e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007082329830154777, + "sensitivity": 0.5386833049611613 + }, + { + "name": "model.layers.32.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.717349631595425e-05, + "sensitivity": 1.1645337476644635 + }, + { + "name": "model.layers.32.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.063376203092048e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6595290516270325e-05, + "sensitivity": 0.6741938063173372 + }, + { + "name": "model.layers.32.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006903344765305519, + "sensitivity": 0.5904269513248983 + }, + { + "name": "model.layers.32.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.936674132404733e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006825685268267989, + "sensitivity": 0.575232272570484 + }, + { + "name": "model.layers.32.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4613337852060795e-05, + "sensitivity": 0.8231950585458379 + }, + { + "name": "model.layers.32.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.90253125160234e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.697091546608135e-05, + "sensitivity": 0.9315570205131368 + }, + { + "name": "model.layers.32.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.956495806458406e-05, + "sensitivity": 0.9557852232681884 + }, + { + "name": "model.layers.32.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0277642559231026e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.93583972658962e-05, + "sensitivity": 0.6632908220734861 + }, + { + "name": "model.layers.32.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.818991849082522e-05, + "sensitivity": 0.788923386559863 + }, + { + "name": "model.layers.32.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.086329899015254e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006477299029938877, + "sensitivity": 0.5401601777353245 + }, + { + "name": "model.layers.32.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.930311090196483e-05, + "sensitivity": 0.976002747168798 + }, + { + "name": "model.layers.32.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0261964007440838e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006750712636858225, + "sensitivity": 0.5635334888929803 + }, + { + "name": "model.layers.32.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.726619201595895e-05, + "sensitivity": 0.641452012568015 + }, + { + "name": "model.layers.32.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.734861012271722e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006624259403906763, + "sensitivity": 0.544644950746431 + }, + { + "name": "model.layers.32.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.987042823107913e-05, + "sensitivity": 0.8828869072055597 + }, + { + "name": "model.layers.32.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1114946119050728e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006926789646968246, + "sensitivity": 0.5418076702668061 + }, + { + "name": "model.layers.32.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.834604235133156e-05, + "sensitivity": 0.7405520023711487 + }, + { + "name": "model.layers.32.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.418398351750511e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006570319528691471, + "sensitivity": 0.5141282953767896 + }, + { + "name": "model.layers.32.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.156949191587046e-05, + "sensitivity": 0.6975456027996739 + }, + { + "name": "model.layers.32.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.852090675442014e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005866794381290674, + "sensitivity": 0.5355309593464829 + }, + { + "name": "model.layers.32.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1322632417432033e-05, + "sensitivity": 1.6692574026486922 + }, + { + "name": "model.layers.32.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.513217284809798e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.322185072349384e-05, + "sensitivity": 1.009470402418739 + }, + { + "name": "model.layers.32.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.60502776352223e-05, + "sensitivity": 0.9767531550004218 + }, + { + "name": "model.layers.32.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.238066809302836e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006358891259878874, + "sensitivity": 0.5474379857543366 + }, + { + "name": "model.layers.32.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.143245263956487e-05, + "sensitivity": 0.6645565415599884 + }, + { + "name": "model.layers.32.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.034397428156808e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006905384361743927, + "sensitivity": 0.536319254804999 + }, + { + "name": "model.layers.32.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006973270210437477, + "sensitivity": 0.5914682546704799 + }, + { + "name": "model.layers.32.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.33702870295383e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006880580331198871, + "sensitivity": 0.5122294213799852 + }, + { + "name": "model.layers.32.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.46451226202771e-05, + "sensitivity": 0.6096137852475064 + }, + { + "name": "model.layers.32.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0226520998912747e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007687066681683064, + "sensitivity": 0.5449326301095927 + }, + { + "name": "model.layers.32.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.88187322136946e-05, + "sensitivity": 1.1217431541954221 + }, + { + "name": "model.layers.32.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.720090025031823e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006576607702299953, + "sensitivity": 0.5255462002375895 + }, + { + "name": "model.layers.32.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.061435068550054e-05, + "sensitivity": 1.3791163924063794 + }, + { + "name": "model.layers.32.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4111644759395858e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.700270412489772e-05, + "sensitivity": 0.6867830933798955 + }, + { + "name": "model.layers.32.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.149924355559051e-05, + "sensitivity": 1.6517615031878943 + }, + { + "name": "model.layers.32.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2194500413897913e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007148664444684982, + "sensitivity": 0.5783521112848677 + }, + { + "name": "model.layers.32.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.497354479506612e-05, + "sensitivity": 0.8692732489609256 + }, + { + "name": "model.layers.32.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.327180012202007e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.663645035587251e-05, + "sensitivity": 0.6413145332981645 + }, + { + "name": "model.layers.32.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.786193651147187e-05, + "sensitivity": 0.9475612173446171 + }, + { + "name": "model.layers.32.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.365259418496862e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006625970709137619, + "sensitivity": 0.5255912123004578 + }, + { + "name": "model.layers.32.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0621602996252477e-05, + "sensitivity": 1.3041878290975055 + }, + { + "name": "model.layers.32.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.459179076045984e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00066731235710904, + "sensitivity": 0.5554847187382739 + }, + { + "name": "model.layers.32.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1093470675405115e-05, + "sensitivity": 1.6966364016660584 + }, + { + "name": "model.layers.32.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.985550152829092e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006767305894754827, + "sensitivity": 0.5519867812408302 + }, + { + "name": "model.layers.32.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.912702908972278e-05, + "sensitivity": 1.1945746090293157 + }, + { + "name": "model.layers.32.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.29153884499101e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006620024796575308, + "sensitivity": 0.5961163561237249 + }, + { + "name": "model.layers.32.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.641099753323942e-05, + "sensitivity": 0.7618022512305784 + }, + { + "name": "model.layers.32.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.094386091921479e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007610111497342587, + "sensitivity": 0.543890354517218 + }, + { + "name": "model.layers.32.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0864898285944946e-05, + "sensitivity": 1.3278826991831658 + }, + { + "name": "model.layers.32.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.485449262072507e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006556726293638349, + "sensitivity": 0.5221055768649021 + }, + { + "name": "model.layers.32.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0852518244064413e-05, + "sensitivity": 1.5022062002047027 + }, + { + "name": "model.layers.32.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6679796317475848e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8271409216104075e-05, + "sensitivity": 0.7848804845523457 + }, + { + "name": "model.layers.32.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.118597957538441e-05, + "sensitivity": 0.7279647885219872 + }, + { + "name": "model.layers.32.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.100060201992164e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006762716802768409, + "sensitivity": 0.5568235860719813 + }, + { + "name": "model.layers.32.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0816091718152165e-05, + "sensitivity": 1.1811710406826106 + }, + { + "name": "model.layers.32.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.248739848364494e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006897016428411007, + "sensitivity": 0.5520486158114044 + }, + { + "name": "model.layers.32.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.088835961127188e-05, + "sensitivity": 1.431903240480181 + }, + { + "name": "model.layers.32.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.901120173097297e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.988491466268897e-05, + "sensitivity": 0.6567586809324092 + }, + { + "name": "model.layers.32.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0976272278639954e-05, + "sensitivity": 1.6874613005047479 + }, + { + "name": "model.layers.32.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.027610096571152e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.808612331748009e-05, + "sensitivity": 0.6295627774539856 + }, + { + "name": "model.layers.32.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6672259233891964e-05, + "sensitivity": 1.1628600132126823 + }, + { + "name": "model.layers.32.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.664439405947633e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7695531722856686e-05, + "sensitivity": 0.6720524465342259 + }, + { + "name": "model.layers.32.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.770161341293715e-06, + "sensitivity": 1.4911669168210928 + }, + { + "name": "model.layers.32.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.8191164953314e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5719472584314644e-05, + "sensitivity": 0.6040836071643793 + }, + { + "name": "model.layers.32.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.729196345782839e-05, + "sensitivity": 0.750060990485751 + }, + { + "name": "model.layers.32.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.850198239291785e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006503543118014932, + "sensitivity": 0.568819311109846 + }, + { + "name": "model.layers.32.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.162931094877422e-05, + "sensitivity": 0.7559608344590685 + }, + { + "name": "model.layers.32.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.729560707048222e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006857152911834419, + "sensitivity": 0.5387041399548603 + }, + { + "name": "model.layers.32.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0470132110640407e-05, + "sensitivity": 1.6138631517426663 + }, + { + "name": "model.layers.32.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0311041478416882e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006508991355076432, + "sensitivity": 0.5960613613684032 + }, + { + "name": "model.layers.32.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.801668157801032e-05, + "sensitivity": 0.9609576704625854 + }, + { + "name": "model.layers.32.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0155936251976527e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.880543903913349e-05, + "sensitivity": 0.6126103347116535 + }, + { + "name": "model.layers.32.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.923404387431219e-05, + "sensitivity": 0.9117298660508 + }, + { + "name": "model.layers.32.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.553265959359123e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006588222458958626, + "sensitivity": 0.5224879816870988 + }, + { + "name": "model.layers.32.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.300793756963685e-05, + "sensitivity": 1.1258251176220837 + }, + { + "name": "model.layers.32.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.623611963936128e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.425791070796549e-05, + "sensitivity": 0.6552531582772733 + }, + { + "name": "model.layers.32.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.612989091081545e-05, + "sensitivity": 0.7769363950520056 + }, + { + "name": "model.layers.32.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0204964837612351e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.777502130717039e-05, + "sensitivity": 0.6203038813845021 + }, + { + "name": "model.layers.32.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1042657206417061e-05, + "sensitivity": 1.4944535653989512 + }, + { + "name": "model.layers.32.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1706025588864577e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006827153265476227, + "sensitivity": 0.5392869724940161 + }, + { + "name": "model.layers.32.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.2736039682058617e-06, + "sensitivity": 2.0972518681062153 + }, + { + "name": "model.layers.32.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.123725029283378e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006308412412181497, + "sensitivity": 0.5320360514649368 + }, + { + "name": "model.layers.32.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.597793253604323e-05, + "sensitivity": 0.699485763742341 + }, + { + "name": "model.layers.32.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2323173450567992e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.563225178979337e-05, + "sensitivity": 0.6569452509575985 + }, + { + "name": "model.layers.32.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 2.9369743970164564e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.440627440591925e-06, + "sensitivity": 2.1015494996697015 + }, + { + "name": "model.layers.32.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3235816140877432e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.32.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.6230035271291854e-06, + "sensitivity": 2.10147411484859 + }, + { + "name": "model.layers.32.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 4.29903193435166e-05, + "sensitivity": 1.8097854934768456 + }, + { + "name": "model.layers.32.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00022153585450723767, + "sensitivity": 1.1512106715504524 + }, + { + "name": "model.layers.32.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.786085522326175e-05, + "sensitivity": 1.5227144173150438 + }, + { + "name": "model.layers.32.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.2333456551423296e-05, + "sensitivity": 0.7690258458586214 + }, + { + "name": "model.layers.32.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003518016601447016, + "sensitivity": 0.7687551116241086 + }, + { + "name": "model.layers.33.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0935173122561537e-05, + "sensitivity": 1.357327172259768 + }, + { + "name": "model.layers.33.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.705648729621316e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006763027049601078, + "sensitivity": 0.5425801130602861 + }, + { + "name": "model.layers.33.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4263597121462226e-05, + "sensitivity": 0.7615885643962059 + }, + { + "name": "model.layers.33.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.873074423514481e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006472980603575706, + "sensitivity": 0.5780588861750796 + }, + { + "name": "model.layers.33.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.469827349064872e-05, + "sensitivity": 0.6798072314704586 + }, + { + "name": "model.layers.33.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.03966599960404e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007459461921826005, + "sensitivity": 0.5276968366631059 + }, + { + "name": "model.layers.33.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006316097569651902, + "sensitivity": 0.5349558568507965 + }, + { + "name": "model.layers.33.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.361397026921622e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006321565015241504, + "sensitivity": 0.5458833379534402 + }, + { + "name": "model.layers.33.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.135971489129588e-05, + "sensitivity": 0.7460046571106476 + }, + { + "name": "model.layers.33.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.168358706621802e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007078958442434669, + "sensitivity": 0.5368272350668164 + }, + { + "name": "model.layers.33.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.729952681576833e-05, + "sensitivity": 1.005330055097516 + }, + { + "name": "model.layers.33.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.819968234594853e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006445999606512487, + "sensitivity": 0.5786093229507147 + }, + { + "name": "model.layers.33.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.260191003093496e-05, + "sensitivity": 0.6770907701562731 + }, + { + "name": "model.layers.33.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.043189058691496e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007033710135146976, + "sensitivity": 0.5313038625979651 + }, + { + "name": "model.layers.33.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.838399374624714e-05, + "sensitivity": 0.8270816930553891 + }, + { + "name": "model.layers.33.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6106696421047673e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006431511137634516, + "sensitivity": 0.5564183440244777 + }, + { + "name": "model.layers.33.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.270313315326348e-05, + "sensitivity": 0.8369618487093129 + }, + { + "name": "model.layers.33.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.218565656330611e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007056035101413727, + "sensitivity": 0.5030787924748258 + }, + { + "name": "model.layers.33.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.142993824032601e-05, + "sensitivity": 1.2552058876098209 + }, + { + "name": "model.layers.33.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.182852641562931e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.145790393929929e-05, + "sensitivity": 0.6185768920278032 + }, + { + "name": "model.layers.33.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007285535102710128, + "sensitivity": 0.591301711522398 + }, + { + "name": "model.layers.33.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.228709364426322e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007371436222456396, + "sensitivity": 0.5288844679546147 + }, + { + "name": "model.layers.33.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0536215086176526e-05, + "sensitivity": 1.6551706290648724 + }, + { + "name": "model.layers.33.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.28241673186858e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000636975048109889, + "sensitivity": 0.5330480206998189 + }, + { + "name": "model.layers.33.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8517864090390503e-05, + "sensitivity": 0.987096900910117 + }, + { + "name": "model.layers.33.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2603449022208224e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0065674915676937e-05, + "sensitivity": 0.7208401319564457 + }, + { + "name": "model.layers.33.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.103645137045532e-05, + "sensitivity": 0.7341119995284257 + }, + { + "name": "model.layers.33.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.435224915752769e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006838801200501621, + "sensitivity": 0.5234124011691028 + }, + { + "name": "model.layers.33.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.038291520671919e-05, + "sensitivity": 1.2630671169493808 + }, + { + "name": "model.layers.33.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3509536529454635e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5470529332524166e-05, + "sensitivity": 0.6543379455242903 + }, + { + "name": "model.layers.33.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.04270571784582e-05, + "sensitivity": 0.6410350560528156 + }, + { + "name": "model.layers.33.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.754142987119849e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006652912124991417, + "sensitivity": 0.5364102600073827 + }, + { + "name": "model.layers.33.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.664220589096658e-05, + "sensitivity": 1.1753439808706065 + }, + { + "name": "model.layers.33.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.851198802200088e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006533404812216759, + "sensitivity": 0.5644819776062547 + }, + { + "name": "model.layers.33.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.954558193683624e-05, + "sensitivity": 0.9935864562441132 + }, + { + "name": "model.layers.33.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0105986802955158e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008267539087682962, + "sensitivity": 0.5231779749237354 + }, + { + "name": "model.layers.33.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.707211676053703e-05, + "sensitivity": 0.9523878565103993 + }, + { + "name": "model.layers.33.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.620360176792019e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006609453703276813, + "sensitivity": 0.5486342466791894 + }, + { + "name": "model.layers.33.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.981654248898849e-05, + "sensitivity": 1.049382744147329 + }, + { + "name": "model.layers.33.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.144900220941054e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000694672460667789, + "sensitivity": 0.5573886649541657 + }, + { + "name": "model.layers.33.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.840116864419542e-05, + "sensitivity": 0.7007606732434328 + }, + { + "name": "model.layers.33.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.160467134781356e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006809725309722126, + "sensitivity": 0.5245818136462933 + }, + { + "name": "model.layers.33.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.472400855273008e-05, + "sensitivity": 0.7222306268444341 + }, + { + "name": "model.layers.33.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.841855899139773e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007193984347395599, + "sensitivity": 0.5736848635520844 + }, + { + "name": "model.layers.33.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.270361336646602e-05, + "sensitivity": 0.7462664473709852 + }, + { + "name": "model.layers.33.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.332689051509078e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007026779348962009, + "sensitivity": 0.5964102161219762 + }, + { + "name": "model.layers.33.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1540137165866327e-05, + "sensitivity": 1.3200462056435762 + }, + { + "name": "model.layers.33.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2862459470852627e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007162190740928054, + "sensitivity": 0.5665443546093911 + }, + { + "name": "model.layers.33.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.631584983551875e-05, + "sensitivity": 0.6221435639344549 + }, + { + "name": "model.layers.33.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.86304894973e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007309670327231288, + "sensitivity": 0.5288485675752805 + }, + { + "name": "model.layers.33.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006649877759627998, + "sensitivity": 0.5531085070067545 + }, + { + "name": "model.layers.33.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.212170203274582e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006966012879274786, + "sensitivity": 0.5223196463255826 + }, + { + "name": "model.layers.33.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.111067341407761e-05, + "sensitivity": 0.6063809839654098 + }, + { + "name": "model.layers.33.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.369437409783131e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006940590683370829, + "sensitivity": 0.5454365129767295 + }, + { + "name": "model.layers.33.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.365760110478732e-06, + "sensitivity": 2.097621653795591 + }, + { + "name": "model.layers.33.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5414528888868517e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.688913370249793e-05, + "sensitivity": 0.98808022228594 + }, + { + "name": "model.layers.33.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.781790241599083e-05, + "sensitivity": 1.0281725923848852 + }, + { + "name": "model.layers.33.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0554360869718948e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.552550283027813e-05, + "sensitivity": 0.6903858039244625 + }, + { + "name": "model.layers.33.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006442618323490024, + "sensitivity": 0.5155975118527106 + }, + { + "name": "model.layers.33.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.782804007343657e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006780314142815769, + "sensitivity": 0.5487423742330373 + }, + { + "name": "model.layers.33.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.974509258521721e-05, + "sensitivity": 1.1192805685714602 + }, + { + "name": "model.layers.33.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.075738282452221e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006774912471882999, + "sensitivity": 0.5517737643408825 + }, + { + "name": "model.layers.33.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.678359229932539e-05, + "sensitivity": 0.8526137220352447 + }, + { + "name": "model.layers.33.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.300659939981415e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.179579941090196e-05, + "sensitivity": 0.6074110225524557 + }, + { + "name": "model.layers.33.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.734213482355699e-05, + "sensitivity": 1.0822690994136364 + }, + { + "name": "model.layers.33.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.780969776329584e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006309857708401978, + "sensitivity": 0.5839953304638935 + }, + { + "name": "model.layers.33.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7126220781356096e-05, + "sensitivity": 0.9532127577608518 + }, + { + "name": "model.layers.33.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.448053906955465e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006521969335153699, + "sensitivity": 0.5647707353599619 + }, + { + "name": "model.layers.33.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0840587492566556e-05, + "sensitivity": 1.3058036265875321 + }, + { + "name": "model.layers.33.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.547608215143555e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006398960249498487, + "sensitivity": 0.5323489424195229 + }, + { + "name": "model.layers.33.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.301819666987285e-05, + "sensitivity": 0.8448436419194202 + }, + { + "name": "model.layers.33.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.448611990592326e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007058662595227361, + "sensitivity": 0.5115687684135026 + }, + { + "name": "model.layers.33.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007059999625198543, + "sensitivity": 0.5855556406120271 + }, + { + "name": "model.layers.33.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.43421594506799e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000725842546671629, + "sensitivity": 0.5614629736439508 + }, + { + "name": "model.layers.33.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.097492223489098e-05, + "sensitivity": 0.7803281637406261 + }, + { + "name": "model.layers.33.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.959256885849754e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006831944920122623, + "sensitivity": 0.5540704069247394 + }, + { + "name": "model.layers.33.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0611331163090654e-05, + "sensitivity": 1.804780818972745 + }, + { + "name": "model.layers.33.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2348932614258956e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006621351349167526, + "sensitivity": 0.5911216337356009 + }, + { + "name": "model.layers.33.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.907185186515562e-05, + "sensitivity": 0.9186351825095878 + }, + { + "name": "model.layers.33.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.340053909705603e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006756647489964962, + "sensitivity": 0.5442121353797494 + }, + { + "name": "model.layers.33.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006402754806913435, + "sensitivity": 0.5889837128485109 + }, + { + "name": "model.layers.33.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.516291589126922e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006688520079478621, + "sensitivity": 0.5492975247105738 + }, + { + "name": "model.layers.33.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8962494222214445e-05, + "sensitivity": 0.9597710439923124 + }, + { + "name": "model.layers.33.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.995133953249024e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006515582790598273, + "sensitivity": 0.5345284045073841 + }, + { + "name": "model.layers.33.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.266385753406212e-05, + "sensitivity": 0.763485597459077 + }, + { + "name": "model.layers.33.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.129837851811317e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007119818474166095, + "sensitivity": 0.5480128400264495 + }, + { + "name": "model.layers.33.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.014424070599489e-05, + "sensitivity": 0.9767099472132139 + }, + { + "name": "model.layers.33.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.73860642514046e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000660466670524329, + "sensitivity": 0.5348862709773149 + }, + { + "name": "model.layers.33.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0826212575193495e-05, + "sensitivity": 0.6431945885094759 + }, + { + "name": "model.layers.33.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.468199214599736e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000676833325996995, + "sensitivity": 0.5672931860942725 + }, + { + "name": "model.layers.33.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0782342542370316e-05, + "sensitivity": 1.254290353125612 + }, + { + "name": "model.layers.33.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4660097349405987e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006819835398346186, + "sensitivity": 0.5940434178596681 + }, + { + "name": "model.layers.33.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.503813448129222e-06, + "sensitivity": 2.097163744272483 + }, + { + "name": "model.layers.33.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1674818551909993e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007026073872111738, + "sensitivity": 0.5516120981899584 + }, + { + "name": "model.layers.33.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 3.0344267543114256e-06, + "sensitivity": 2.097748487121366 + }, + { + "name": "model.layers.33.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3900751127948752e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.117284985724837e-05, + "sensitivity": 0.8326120800339636 + }, + { + "name": "model.layers.33.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0172751899517607e-05, + "sensitivity": 1.5510321080370402 + }, + { + "name": "model.layers.33.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.529762686113827e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006110860267654061, + "sensitivity": 0.527406858482833 + }, + { + "name": "model.layers.33.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.050019874237478e-05, + "sensitivity": 1.0926827090735687 + }, + { + "name": "model.layers.33.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.249111733159225e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006709519657306373, + "sensitivity": 0.5630642421704241 + }, + { + "name": "model.layers.33.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007128085708245635, + "sensitivity": 0.5714003560040491 + }, + { + "name": "model.layers.33.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.224858791232691e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.416437099687755e-05, + "sensitivity": 0.7218997861590706 + }, + { + "name": "model.layers.33.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7248860684921965e-05, + "sensitivity": 0.8204434380490525 + }, + { + "name": "model.layers.33.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.365882422367577e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006531433900818229, + "sensitivity": 0.5685186197723048 + }, + { + "name": "model.layers.33.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.972789949737489e-05, + "sensitivity": 0.65540285897746 + }, + { + "name": "model.layers.33.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.27271264824958e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006736629875376821, + "sensitivity": 0.5075015005900184 + }, + { + "name": "model.layers.33.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1311136404401623e-05, + "sensitivity": 1.3503657040868013 + }, + { + "name": "model.layers.33.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.215009532046679e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007219213293865323, + "sensitivity": 0.5971190924311695 + }, + { + "name": "model.layers.33.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.284036498982459e-05, + "sensitivity": 0.8509925800705197 + }, + { + "name": "model.layers.33.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.554519238008652e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007166103459894657, + "sensitivity": 0.5647492108672031 + }, + { + "name": "model.layers.33.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.168246909510344e-05, + "sensitivity": 1.04754971877923 + }, + { + "name": "model.layers.33.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.519450034327747e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007020856137387455, + "sensitivity": 0.5334680301849597 + }, + { + "name": "model.layers.33.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0471141649759375e-05, + "sensitivity": 1.3403094610138757 + }, + { + "name": "model.layers.33.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0331198154744925e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000673146394547075, + "sensitivity": 0.5688206150499103 + }, + { + "name": "model.layers.33.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.295336061157286e-05, + "sensitivity": 0.7989876692501868 + }, + { + "name": "model.layers.33.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.549392648797948e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007211660849861801, + "sensitivity": 0.5248376588812804 + }, + { + "name": "model.layers.33.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007112195598892868, + "sensitivity": 0.5255299531752364 + }, + { + "name": "model.layers.33.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.623452802363317e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007234588265419006, + "sensitivity": 0.5439883432967989 + }, + { + "name": "model.layers.33.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.519117596326396e-05, + "sensitivity": 1.0808462741734104 + }, + { + "name": "model.layers.33.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.220356448873645e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.658092024736106e-05, + "sensitivity": 0.6587357752690652 + }, + { + "name": "model.layers.33.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.634475019178353e-05, + "sensitivity": 0.8846579596170361 + }, + { + "name": "model.layers.33.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.141318193731422e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006379438564181328, + "sensitivity": 0.5428039654811827 + }, + { + "name": "model.layers.33.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.922419222770259e-05, + "sensitivity": 0.7394532911512341 + }, + { + "name": "model.layers.33.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.063754310365766e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006797193782404065, + "sensitivity": 0.5173129155920932 + }, + { + "name": "model.layers.33.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.496974674519151e-05, + "sensitivity": 0.782823637961614 + }, + { + "name": "model.layers.33.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.36455831429339e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007271577487699687, + "sensitivity": 0.5261445730604687 + }, + { + "name": "model.layers.33.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.130732799647376e-05, + "sensitivity": 0.7705933063296202 + }, + { + "name": "model.layers.33.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.255551051661314e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006846903706900775, + "sensitivity": 0.5711103829369704 + }, + { + "name": "model.layers.33.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 2.7226280963077443e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3698721633991227e-06, + "sensitivity": 2.1016800938131195 + }, + { + "name": "model.layers.33.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3968805205877288e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.33.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.632758312553051e-06, + "sensitivity": 2.1022399157547405 + }, + { + "name": "model.layers.33.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 3.7790461647091433e-05, + "sensitivity": 1.8815554419241358 + }, + { + "name": "model.layers.33.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 4, + "mse": 3.280419696238823e-05, + "sensitivity": 1.2487906536674969 + }, + { + "name": "model.layers.33.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.4641578673035838e-05, + "sensitivity": 1.3577588312486972 + }, + { + "name": "model.layers.33.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.6579941883683205e-05, + "sensitivity": 0.7668126065899651 + }, + { + "name": "model.layers.33.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002731051354203373, + "sensitivity": 1.1042670175269305 + }, + { + "name": "model.layers.34.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006829413468949497, + "sensitivity": 0.5584614934395276 + }, + { + "name": "model.layers.34.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.036297802187619e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006753777852281928, + "sensitivity": 0.5317845838290897 + }, + { + "name": "model.layers.34.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.931530904490501e-05, + "sensitivity": 1.1392925896592292 + }, + { + "name": "model.layers.34.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3701513807973242e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006764413556084037, + "sensitivity": 0.545735626949245 + }, + { + "name": "model.layers.34.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.071657844586298e-05, + "sensitivity": 0.6819437489607418 + }, + { + "name": "model.layers.34.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1052582067350158e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.988156044622883e-05, + "sensitivity": 0.6260624585106176 + }, + { + "name": "model.layers.34.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.067240610718727e-05, + "sensitivity": 0.7864097756373085 + }, + { + "name": "model.layers.34.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.604682418284938e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006964824860915542, + "sensitivity": 0.5237862097189798 + }, + { + "name": "model.layers.34.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.977919136057608e-05, + "sensitivity": 0.8530142435768685 + }, + { + "name": "model.layers.34.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.60322381615697e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006631655851379037, + "sensitivity": 0.5290823842917889 + }, + { + "name": "model.layers.34.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1024810191884171e-05, + "sensitivity": 1.2127970807378519 + }, + { + "name": "model.layers.34.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2118470067434828e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006850915960967541, + "sensitivity": 0.5190367251247088 + }, + { + "name": "model.layers.34.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.891914770472795e-05, + "sensitivity": 0.8671300125325141 + }, + { + "name": "model.layers.34.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.526129254780244e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.901047188672237e-05, + "sensitivity": 0.8509700505018893 + }, + { + "name": "model.layers.34.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.284750270424411e-05, + "sensitivity": 0.8290409910661871 + }, + { + "name": "model.layers.34.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1059264579671435e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.19568454567343e-05, + "sensitivity": 0.6343809655935064 + }, + { + "name": "model.layers.34.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0026875871699303e-05, + "sensitivity": 1.0101304439991818 + }, + { + "name": "model.layers.34.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3151829989510588e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006810060003772378, + "sensitivity": 0.5908925222330682 + }, + { + "name": "model.layers.34.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0775014743558131e-05, + "sensitivity": 1.3392129917040134 + }, + { + "name": "model.layers.34.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.185024285012332e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006561427726410329, + "sensitivity": 0.5528459900278957 + }, + { + "name": "model.layers.34.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.00069072050973773, + "sensitivity": 0.5241925577246288 + }, + { + "name": "model.layers.34.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.296868602679751e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006842344300821424, + "sensitivity": 0.5416831498821567 + }, + { + "name": "model.layers.34.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.979105925594922e-06, + "sensitivity": 1.2752642815505681 + }, + { + "name": "model.layers.34.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.207587501994567e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006192241562530398, + "sensitivity": 0.5811035863994551 + }, + { + "name": "model.layers.34.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.31433431408368e-05, + "sensitivity": 0.8938001750860358 + }, + { + "name": "model.layers.34.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.217317943286616e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007066546240821481, + "sensitivity": 0.5497553596587273 + }, + { + "name": "model.layers.34.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006927845533937216, + "sensitivity": 0.564905878651085 + }, + { + "name": "model.layers.34.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.293171731565963e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006844573654234409, + "sensitivity": 0.504330812489783 + }, + { + "name": "model.layers.34.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.93304609740153e-05, + "sensitivity": 0.7704084064297073 + }, + { + "name": "model.layers.34.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0487851795915049e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008010459132492542, + "sensitivity": 0.546825816272745 + }, + { + "name": "model.layers.34.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000647950975690037, + "sensitivity": 0.577251538452228 + }, + { + "name": "model.layers.34.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.16106660800142e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006558466702699661, + "sensitivity": 0.5326150193714356 + }, + { + "name": "model.layers.34.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.150404078653082e-05, + "sensitivity": 0.6459202577623311 + }, + { + "name": "model.layers.34.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.19586012110085e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006856656400486827, + "sensitivity": 0.5527380379123148 + }, + { + "name": "model.layers.34.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.131624104455113e-05, + "sensitivity": 1.0503990893228878 + }, + { + "name": "model.layers.34.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1332252825013711e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006885865586809814, + "sensitivity": 0.5524749200829137 + }, + { + "name": "model.layers.34.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1041298421332613e-05, + "sensitivity": 1.3824114948100967 + }, + { + "name": "model.layers.34.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3797606470689061e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.67719507671427e-05, + "sensitivity": 0.7142121584269976 + }, + { + "name": "model.layers.34.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.886844494147226e-05, + "sensitivity": 0.6000506419619632 + }, + { + "name": "model.layers.34.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.644236686450313e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.60132897994481e-05, + "sensitivity": 0.6244844662503733 + }, + { + "name": "model.layers.34.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.364415457937866e-05, + "sensitivity": 0.6925207173937462 + }, + { + "name": "model.layers.34.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.600044114042248e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007013862486928701, + "sensitivity": 0.5107935438276927 + }, + { + "name": "model.layers.34.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.1033962992951274e-05, + "sensitivity": 0.6066415628866513 + }, + { + "name": "model.layers.34.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.752031478958088e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000683712016325444, + "sensitivity": 0.5267787186835615 + }, + { + "name": "model.layers.34.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006350462790578604, + "sensitivity": 0.575240528874233 + }, + { + "name": "model.layers.34.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.441274985671043e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006336045917123556, + "sensitivity": 0.5936785020218015 + }, + { + "name": "model.layers.34.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6771968957036734e-05, + "sensitivity": 0.7487253114328934 + }, + { + "name": "model.layers.34.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.561093641721527e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006328242598101497, + "sensitivity": 0.5666541492314147 + }, + { + "name": "model.layers.34.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.602384382858872e-05, + "sensitivity": 0.610929069134685 + }, + { + "name": "model.layers.34.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.855623493924213e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007826555520296097, + "sensitivity": 0.527796878057574 + }, + { + "name": "model.layers.34.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.778986426070333e-05, + "sensitivity": 0.8510190091623739 + }, + { + "name": "model.layers.34.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3185208445065655e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.986632070038468e-05, + "sensitivity": 0.6598650346842574 + }, + { + "name": "model.layers.34.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.468162635224871e-05, + "sensitivity": 1.0822427346188923 + }, + { + "name": "model.layers.34.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.632360959381913e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6571687309769914e-05, + "sensitivity": 0.6256662928749623 + }, + { + "name": "model.layers.34.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.963783769402653e-05, + "sensitivity": 0.9233260325537411 + }, + { + "name": "model.layers.34.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.799241868473473e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006859648856334388, + "sensitivity": 0.5199387344913411 + }, + { + "name": "model.layers.34.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0361922250012867e-05, + "sensitivity": 1.60893549266336 + }, + { + "name": "model.layers.34.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.432395593947149e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006375653902068734, + "sensitivity": 0.5634235266640369 + }, + { + "name": "model.layers.34.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.28558118478395e-05, + "sensitivity": 0.7943029761258581 + }, + { + "name": "model.layers.34.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.904118663442205e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006989878602325916, + "sensitivity": 0.5293935511423185 + }, + { + "name": "model.layers.34.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.369658512994647e-05, + "sensitivity": 0.6297341304225218 + }, + { + "name": "model.layers.34.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2179381201349315e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007171913748607039, + "sensitivity": 0.5184104410166418 + }, + { + "name": "model.layers.34.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0843216841749381e-05, + "sensitivity": 1.550677434029636 + }, + { + "name": "model.layers.34.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.040831875798176e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006653386517427862, + "sensitivity": 0.5373979560286926 + }, + { + "name": "model.layers.34.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.592248635366559e-05, + "sensitivity": 0.778073973347031 + }, + { + "name": "model.layers.34.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.952473535828176e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8247591368854046e-05, + "sensitivity": 0.6984130742245582 + }, + { + "name": "model.layers.34.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006957526202313602, + "sensitivity": 0.5882787929222644 + }, + { + "name": "model.layers.34.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.036822123358434e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006964132189750671, + "sensitivity": 0.5382874787704783 + }, + { + "name": "model.layers.34.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.937883906881325e-05, + "sensitivity": 0.9176437850053456 + }, + { + "name": "model.layers.34.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0718180192270665e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006613642908632755, + "sensitivity": 0.5835282547770085 + }, + { + "name": "model.layers.34.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.096890865592286e-05, + "sensitivity": 0.782997204661427 + }, + { + "name": "model.layers.34.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0377909802627983e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006891537341289222, + "sensitivity": 0.5104784460412247 + }, + { + "name": "model.layers.34.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.901340045966208e-05, + "sensitivity": 0.8413793374456648 + }, + { + "name": "model.layers.34.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2117359347030288e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006597561296075583, + "sensitivity": 0.5486043686396302 + }, + { + "name": "model.layers.34.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.284756091190502e-05, + "sensitivity": 0.6467190021174656 + }, + { + "name": "model.layers.34.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.857062650553416e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007035612361505628, + "sensitivity": 0.5036219669388441 + }, + { + "name": "model.layers.34.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.496087841398548e-06, + "sensitivity": 1.2802674860081225 + }, + { + "name": "model.layers.34.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.699597522834665e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006123132188804448, + "sensitivity": 0.5232833314292852 + }, + { + "name": "model.layers.34.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1089893632743042e-05, + "sensitivity": 1.2796265002009344 + }, + { + "name": "model.layers.34.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0497179800950107e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000686654238961637, + "sensitivity": 0.5175298080048208 + }, + { + "name": "model.layers.34.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.143735663499683e-05, + "sensitivity": 0.8542935839694386 + }, + { + "name": "model.layers.34.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.401264952022757e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007025508093647659, + "sensitivity": 0.555459099062038 + }, + { + "name": "model.layers.34.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.251924060052261e-05, + "sensitivity": 1.0402341691725987 + }, + { + "name": "model.layers.34.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.413503564952407e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007016884628683329, + "sensitivity": 0.5288570292381354 + }, + { + "name": "model.layers.34.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.026324626873247e-05, + "sensitivity": 0.8735249455414812 + }, + { + "name": "model.layers.34.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.27217411622405e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006938362494111061, + "sensitivity": 0.5158565179578516 + }, + { + "name": "model.layers.34.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7695469877216965e-05, + "sensitivity": 1.0396036625372957 + }, + { + "name": "model.layers.34.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.274718442800804e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006685964181087911, + "sensitivity": 0.5876797986010103 + }, + { + "name": "model.layers.34.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.02435611654073e-05, + "sensitivity": 0.8306153375511661 + }, + { + "name": "model.layers.34.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0204926184087526e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006916669080965221, + "sensitivity": 0.5484602476199112 + }, + { + "name": "model.layers.34.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.116371514508501e-05, + "sensitivity": 0.6052211373571832 + }, + { + "name": "model.layers.34.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.544749903194315e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006974179996177554, + "sensitivity": 0.5060268771486348 + }, + { + "name": "model.layers.34.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.543830047827214e-05, + "sensitivity": 0.7537996899245423 + }, + { + "name": "model.layers.34.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0005271633417578e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.83422151976265e-05, + "sensitivity": 0.6761535158931652 + }, + { + "name": "model.layers.34.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.083389598643407e-05, + "sensitivity": 0.8061945577259915 + }, + { + "name": "model.layers.34.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3191265679779463e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9778947615996e-05, + "sensitivity": 0.6580110391886917 + }, + { + "name": "model.layers.34.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.482884055003524e-05, + "sensitivity": 0.6975968733266807 + }, + { + "name": "model.layers.34.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.411093060407438e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007357471040450037, + "sensitivity": 0.5170275108354271 + }, + { + "name": "model.layers.34.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1005911801476032e-05, + "sensitivity": 1.6338625723415996 + }, + { + "name": "model.layers.34.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.2045790046831826e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.003624730510637e-05, + "sensitivity": 0.6470221227632623 + }, + { + "name": "model.layers.34.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.732463250751607e-05, + "sensitivity": 0.7072371241068811 + }, + { + "name": "model.layers.34.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.84883354754129e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006516308058053255, + "sensitivity": 0.5857838814410701 + }, + { + "name": "model.layers.34.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1378810086171143e-05, + "sensitivity": 1.3955447646577073 + }, + { + "name": "model.layers.34.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.950948995334329e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007179055246524513, + "sensitivity": 0.5331753267975146 + }, + { + "name": "model.layers.34.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0727528762072325e-05, + "sensitivity": 0.6716579573480425 + }, + { + "name": "model.layers.34.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.124002650016337e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006778436945751309, + "sensitivity": 0.5326784350305463 + }, + { + "name": "model.layers.34.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9245125157758594e-05, + "sensitivity": 0.9428875190747008 + }, + { + "name": "model.layers.34.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.302871267711453e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006735402857884765, + "sensitivity": 0.5507324959933722 + }, + { + "name": "model.layers.34.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.507039198462735e-06, + "sensitivity": 2.0970869950921247 + }, + { + "name": "model.layers.34.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.600389153594733e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007070069550536573, + "sensitivity": 0.5111261610200137 + }, + { + "name": "model.layers.34.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0395566278020851e-05, + "sensitivity": 1.525396831324092 + }, + { + "name": "model.layers.34.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0335578508602339e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006614046869799495, + "sensitivity": 0.562880169423452 + }, + { + "name": "model.layers.34.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.503005589460372e-06, + "sensitivity": 2.097424581741419 + }, + { + "name": "model.layers.34.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.11253962131741e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006903437897562981, + "sensitivity": 0.544582694739254 + }, + { + "name": "model.layers.34.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.826074240962043e-05, + "sensitivity": 1.0958068901889895 + }, + { + "name": "model.layers.34.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0837225090654101e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007977578788995743, + "sensitivity": 0.5609254854730026 + }, + { + "name": "model.layers.34.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.053931429050863e-05, + "sensitivity": 0.9898514797225189 + }, + { + "name": "model.layers.34.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.9216890905227046e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.148965621832758e-05, + "sensitivity": 0.6751209108834287 + }, + { + "name": "model.layers.34.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0086652764584869e-05, + "sensitivity": 1.233090697740095 + }, + { + "name": "model.layers.34.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.645238386226993e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.372654413804412e-05, + "sensitivity": 0.8693394098708487 + }, + { + "name": "model.layers.34.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7833207392832264e-05, + "sensitivity": 1.0866062888477162 + }, + { + "name": "model.layers.34.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0972896689054323e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006279895314946771, + "sensitivity": 0.5542885000832942 + }, + { + "name": "model.layers.34.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007126049022190273, + "sensitivity": 0.5796585863412235 + }, + { + "name": "model.layers.34.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.835926337269484e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007001174381002784, + "sensitivity": 0.5115820567486947 + }, + { + "name": "model.layers.34.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9799273003591225e-05, + "sensitivity": 0.6901166560536101 + }, + { + "name": "model.layers.34.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.846975679764e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006782313575968146, + "sensitivity": 0.5321935561105177 + }, + { + "name": "model.layers.34.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1877155884576496e-05, + "sensitivity": 1.4720899075842069 + }, + { + "name": "model.layers.34.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2622472240764182e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.538846355397254e-05, + "sensitivity": 0.6948403282946294 + }, + { + "name": "model.layers.34.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 2.4884384401957504e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.1798055058752652e-06, + "sensitivity": 2.101165805651614 + }, + { + "name": "model.layers.34.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8697804762268788e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.34.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.5563781516902964e-06, + "sensitivity": 2.1016828044447946 + }, + { + "name": "model.layers.34.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 7.99723966338206e-06, + "sensitivity": 2.2026844665975402 + }, + { + "name": "model.layers.34.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00018199138867203146, + "sensitivity": 0.9569487031581467 + }, + { + "name": "model.layers.34.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.568809057062026e-05, + "sensitivity": 1.4101238499095523 + }, + { + "name": "model.layers.34.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.361348303267732e-05, + "sensitivity": 0.709301810261124 + }, + { + "name": "model.layers.34.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00029668156639672816, + "sensitivity": 0.811892795330873 + }, + { + "name": "model.layers.35.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.70618431083858e-05, + "sensitivity": 1.0991253008030595 + }, + { + "name": "model.layers.35.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1424307331253658e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006386045715771616, + "sensitivity": 0.5335525931637266 + }, + { + "name": "model.layers.35.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4359941714210436e-05, + "sensitivity": 0.8840672425538806 + }, + { + "name": "model.layers.35.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0359588031860767e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006100083119235933, + "sensitivity": 0.5816245967245918 + }, + { + "name": "model.layers.35.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0829574421222787e-05, + "sensitivity": 1.3377334911122236 + }, + { + "name": "model.layers.35.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5389603049698053e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.451339868362993e-05, + "sensitivity": 0.6412481509987683 + }, + { + "name": "model.layers.35.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.868312291568145e-05, + "sensitivity": 1.0711933971764047 + }, + { + "name": "model.layers.35.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.097270569516695e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006542782066389918, + "sensitivity": 0.5487574227791796 + }, + { + "name": "model.layers.35.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0156160897167865e-05, + "sensitivity": 1.944065664453109 + }, + { + "name": "model.layers.35.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.069057134372997e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.492334457812831e-05, + "sensitivity": 0.7091742828328679 + }, + { + "name": "model.layers.35.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.635496199829504e-05, + "sensitivity": 0.8790567488155168 + }, + { + "name": "model.layers.35.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1596533795454889e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006356982048600912, + "sensitivity": 0.5505319843789369 + }, + { + "name": "model.layers.35.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.678994395770133e-05, + "sensitivity": 0.8683572425077949 + }, + { + "name": "model.layers.35.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.068061217476497e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007849936373531818, + "sensitivity": 0.5479522504023678 + }, + { + "name": "model.layers.35.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.894468631595373e-05, + "sensitivity": 0.7061949481807932 + }, + { + "name": "model.layers.35.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.598537419857166e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006555598229169846, + "sensitivity": 0.5196422105844097 + }, + { + "name": "model.layers.35.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.440957804443315e-05, + "sensitivity": 0.602746469228769 + }, + { + "name": "model.layers.35.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.06949037976301e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007105536642484367, + "sensitivity": 0.5385789417733174 + }, + { + "name": "model.layers.35.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.474636029452085e-05, + "sensitivity": 0.6050056071796563 + }, + { + "name": "model.layers.35.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0398114227427868e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007124672411009669, + "sensitivity": 0.5616764199483478 + }, + { + "name": "model.layers.35.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.436184048652649e-05, + "sensitivity": 0.861222477643339 + }, + { + "name": "model.layers.35.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.071090537152486e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007195805665105581, + "sensitivity": 0.5600039351904381 + }, + { + "name": "model.layers.35.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.481646803673357e-05, + "sensitivity": 0.7983123723549397 + }, + { + "name": "model.layers.35.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2376494851196185e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006257315981201828, + "sensitivity": 0.530401052892314 + }, + { + "name": "model.layers.35.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0451653906784486e-05, + "sensitivity": 1.218425074334331 + }, + { + "name": "model.layers.35.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1715186474248185e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006462531164288521, + "sensitivity": 0.5713204137268588 + }, + { + "name": "model.layers.35.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.950669219600968e-05, + "sensitivity": 0.6306298324093531 + }, + { + "name": "model.layers.35.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.013080350276141e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006570501136593521, + "sensitivity": 0.550030243653942 + }, + { + "name": "model.layers.35.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0770933487219736e-05, + "sensitivity": 0.6674083867765931 + }, + { + "name": "model.layers.35.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.434892263016081e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000672280672006309, + "sensitivity": 0.5418020566923357 + }, + { + "name": "model.layers.35.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.994080856908113e-05, + "sensitivity": 1.047286928775542 + }, + { + "name": "model.layers.35.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1148380281156278e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006776444497518241, + "sensitivity": 0.5382571641010755 + }, + { + "name": "model.layers.35.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.070172856998397e-05, + "sensitivity": 1.3469971518328334 + }, + { + "name": "model.layers.35.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5214599216051283e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.882512414245866e-05, + "sensitivity": 0.6422535228900591 + }, + { + "name": "model.layers.35.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.795253673568368e-05, + "sensitivity": 1.0409013292882752 + }, + { + "name": "model.layers.35.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.068821120497887e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006542092887684703, + "sensitivity": 0.5527116395836542 + }, + { + "name": "model.layers.35.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0685384040698409e-05, + "sensitivity": 1.541086537671292 + }, + { + "name": "model.layers.35.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1337342584738508e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006532776169478893, + "sensitivity": 0.5287220877439335 + }, + { + "name": "model.layers.35.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0540707080508582e-05, + "sensitivity": 1.6423746393701064 + }, + { + "name": "model.layers.35.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.9834277484042104e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7545898016542196e-05, + "sensitivity": 0.6551774347662053 + }, + { + "name": "model.layers.35.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.01495812588837e-05, + "sensitivity": 0.6493685725324408 + }, + { + "name": "model.layers.35.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.29532496027241e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006920799496583641, + "sensitivity": 0.5297903047925777 + }, + { + "name": "model.layers.35.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0517060218262486e-05, + "sensitivity": 1.3534203996318983 + }, + { + "name": "model.layers.35.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.757563136896351e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006607254035770893, + "sensitivity": 0.5512299377451171 + }, + { + "name": "model.layers.35.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.256594158709049e-05, + "sensitivity": 0.9339139943157201 + }, + { + "name": "model.layers.35.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1900618801519158e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006116607692092657, + "sensitivity": 0.5719359603830647 + }, + { + "name": "model.layers.35.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.167267565615475e-05, + "sensitivity": 0.7199065603192373 + }, + { + "name": "model.layers.35.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.500907935944269e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006775010260753334, + "sensitivity": 0.5813643743095401 + }, + { + "name": "model.layers.35.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.080047387513332e-05, + "sensitivity": 0.7637973135896469 + }, + { + "name": "model.layers.35.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.265744213531434e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.058024519006722e-05, + "sensitivity": 0.6153857307836802 + }, + { + "name": "model.layers.35.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.278574437601492e-05, + "sensitivity": 0.6374147595922813 + }, + { + "name": "model.layers.35.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.560322501376504e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007133637554943562, + "sensitivity": 0.5178222037043779 + }, + { + "name": "model.layers.35.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007357698632404208, + "sensitivity": 0.5652300718162229 + }, + { + "name": "model.layers.35.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.701396948003094e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000732538930606097, + "sensitivity": 0.521019440753647 + }, + { + "name": "model.layers.35.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.811664595967159e-05, + "sensitivity": 0.6763219496161457 + }, + { + "name": "model.layers.35.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.730846280333935e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006698654033243656, + "sensitivity": 0.5487278900108788 + }, + { + "name": "model.layers.35.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.744825805071741e-05, + "sensitivity": 0.786950600459317 + }, + { + "name": "model.layers.35.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.886682619253406e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007577185751870275, + "sensitivity": 0.5713144812745226 + }, + { + "name": "model.layers.35.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.628553092014045e-05, + "sensitivity": 0.7999795141096475 + }, + { + "name": "model.layers.35.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.173339551831305e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.799225229769945e-05, + "sensitivity": 0.6469353221347525 + }, + { + "name": "model.layers.35.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006954201962798834, + "sensitivity": 0.5873240417849551 + }, + { + "name": "model.layers.35.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.347252335421217e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006952495314180851, + "sensitivity": 0.5333934741700551 + }, + { + "name": "model.layers.35.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.079291779315099e-05, + "sensitivity": 0.8435514046241619 + }, + { + "name": "model.layers.35.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4017900866747368e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.199085328262299e-05, + "sensitivity": 0.6096661507292274 + }, + { + "name": "model.layers.35.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006357368547469378, + "sensitivity": 0.5638659784620561 + }, + { + "name": "model.layers.35.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.581135944041307e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006415140233002603, + "sensitivity": 0.546470574242871 + }, + { + "name": "model.layers.35.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.115852046496002e-05, + "sensitivity": 1.593687941152419 + }, + { + "name": "model.layers.35.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.358795978187118e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.550576654262841e-05, + "sensitivity": 0.9503877544323037 + }, + { + "name": "model.layers.35.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.737843796145171e-05, + "sensitivity": 0.7973802162586449 + }, + { + "name": "model.layers.35.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1129008044008515e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007645506411790848, + "sensitivity": 0.5672743738707933 + }, + { + "name": "model.layers.35.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006870562210679054, + "sensitivity": 0.5995171994737869 + }, + { + "name": "model.layers.35.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1993320185865741e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006713428301736712, + "sensitivity": 0.5391335303472728 + }, + { + "name": "model.layers.35.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0993821888405364e-05, + "sensitivity": 1.248577801088478 + }, + { + "name": "model.layers.35.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2028760920657078e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006559576722793281, + "sensitivity": 0.522490785380921 + }, + { + "name": "model.layers.35.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7463264965917915e-05, + "sensitivity": 1.1033267873658048 + }, + { + "name": "model.layers.35.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.711975402140524e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006373663782142103, + "sensitivity": 0.5328036127902328 + }, + { + "name": "model.layers.35.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.092158946557902e-05, + "sensitivity": 0.9498970113979277 + }, + { + "name": "model.layers.35.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.215615932589571e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006796100060455501, + "sensitivity": 0.5187139857414349 + }, + { + "name": "model.layers.35.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.920112016610801e-05, + "sensitivity": 0.7984818434758493 + }, + { + "name": "model.layers.35.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0632263638399309e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006603614310733974, + "sensitivity": 0.5231039432909949 + }, + { + "name": "model.layers.35.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.2101764595136046e-05, + "sensitivity": 0.609707986402257 + }, + { + "name": "model.layers.35.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.286053348958376e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006028921343386173, + "sensitivity": 0.5311876161612147 + }, + { + "name": "model.layers.35.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9473150031408295e-05, + "sensitivity": 0.7451729020679763 + }, + { + "name": "model.layers.35.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.954061859687499e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006660178187303245, + "sensitivity": 0.5171516642606113 + }, + { + "name": "model.layers.35.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6319666327908635e-05, + "sensitivity": 0.6794653749016638 + }, + { + "name": "model.layers.35.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.898816415443434e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006338850362226367, + "sensitivity": 0.5591249339564277 + }, + { + "name": "model.layers.35.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.989064811728895e-05, + "sensitivity": 0.6609322029408489 + }, + { + "name": "model.layers.35.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.792647582187783e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006737876683473587, + "sensitivity": 0.5442244715459172 + }, + { + "name": "model.layers.35.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.060202187858522e-05, + "sensitivity": 0.7114875667037105 + }, + { + "name": "model.layers.35.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2097585795345367e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.235466910060495e-05, + "sensitivity": 0.7725651026311318 + }, + { + "name": "model.layers.35.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.106073124101385e-05, + "sensitivity": 0.7129473992420127 + }, + { + "name": "model.layers.35.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.105666115108761e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006691885646432638, + "sensitivity": 0.5393813650654562 + }, + { + "name": "model.layers.35.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.81150850141421e-05, + "sensitivity": 1.091510395383787 + }, + { + "name": "model.layers.35.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.375045806336857e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.577950600534678e-05, + "sensitivity": 1.006115737219582 + }, + { + "name": "model.layers.35.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.427732685348019e-05, + "sensitivity": 0.8332704385087744 + }, + { + "name": "model.layers.35.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4448098681896226e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006172447465360165, + "sensitivity": 0.5940239237940906 + }, + { + "name": "model.layers.35.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.778052582172677e-05, + "sensitivity": 1.1529155944414513 + }, + { + "name": "model.layers.35.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8832631667464739e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006367457681335509, + "sensitivity": 0.5852755029192445 + }, + { + "name": "model.layers.35.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.5821725557761965e-06, + "sensitivity": 2.097214945003743 + }, + { + "name": "model.layers.35.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5941762967486284e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.359293911373243e-05, + "sensitivity": 0.6555078010627673 + }, + { + "name": "model.layers.35.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1505731890792958e-05, + "sensitivity": 1.4939884584062102 + }, + { + "name": "model.layers.35.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1689753591781482e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007119998335838318, + "sensitivity": 0.5232148382310686 + }, + { + "name": "model.layers.35.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0470320022432134e-05, + "sensitivity": 1.00372107165827 + }, + { + "name": "model.layers.35.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0677903219402651e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006696053314954042, + "sensitivity": 0.5542800849817628 + }, + { + "name": "model.layers.35.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5009899369906634e-05, + "sensitivity": 0.709856922108981 + }, + { + "name": "model.layers.35.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1569867410798906e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006622436339966953, + "sensitivity": 0.5406980022220088 + }, + { + "name": "model.layers.35.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006992264534346759, + "sensitivity": 0.5841641530823175 + }, + { + "name": "model.layers.35.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.081315516188624e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007071515428833663, + "sensitivity": 0.5464882386945282 + }, + { + "name": "model.layers.35.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.757948383688927e-05, + "sensitivity": 0.8471379264065128 + }, + { + "name": "model.layers.35.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.804370968893636e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000639239908196032, + "sensitivity": 0.5511641448197959 + }, + { + "name": "model.layers.35.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.130263606493827e-06, + "sensitivity": 1.5889336382791874 + }, + { + "name": "model.layers.35.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.57017766975332e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005977295222692192, + "sensitivity": 0.578765967948971 + }, + { + "name": "model.layers.35.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.64440914685838e-06, + "sensitivity": 1.2212980736134367 + }, + { + "name": "model.layers.35.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2424046644810005e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000597527134232223, + "sensitivity": 0.5537179257818203 + }, + { + "name": "model.layers.35.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.43511523574125e-05, + "sensitivity": 0.8725337699400386 + }, + { + "name": "model.layers.35.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.002697882147913e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006069475784897804, + "sensitivity": 0.5498525465366291 + }, + { + "name": "model.layers.35.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.014588143443689e-05, + "sensitivity": 0.9962118748055571 + }, + { + "name": "model.layers.35.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.216074906551512e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000675952760502696, + "sensitivity": 0.5605988405876947 + }, + { + "name": "model.layers.35.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0991370800184086e-05, + "sensitivity": 1.7862676007467462 + }, + { + "name": "model.layers.35.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.412592951055558e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006926755886524916, + "sensitivity": 0.5804275417077893 + }, + { + "name": "model.layers.35.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.919995601288974e-05, + "sensitivity": 0.7234696589600151 + }, + { + "name": "model.layers.35.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0597540267553995e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006775592337362468, + "sensitivity": 0.5422542011982986 + }, + { + "name": "model.layers.35.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.92062933719717e-05, + "sensitivity": 1.1838927008434639 + }, + { + "name": "model.layers.35.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.426816637234879e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006750643951818347, + "sensitivity": 0.5496560364198025 + }, + { + "name": "model.layers.35.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.046970884199254e-05, + "sensitivity": 0.7322930448950298 + }, + { + "name": "model.layers.35.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.348525059569511e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007005219231359661, + "sensitivity": 0.5624076877850529 + }, + { + "name": "model.layers.35.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0574261068541091e-05, + "sensitivity": 1.8026474699237967 + }, + { + "name": "model.layers.35.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2840240515288315e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006399333942681551, + "sensitivity": 0.5528825490988984 + }, + { + "name": "model.layers.35.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 2.235860392829636e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.5634903977334034e-06, + "sensitivity": 2.101996102787218 + }, + { + "name": "model.layers.35.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.257424966956023e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.35.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.5992445696610957e-06, + "sensitivity": 2.1027581388642904 + }, + { + "name": "model.layers.35.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 7.800614184816368e-06, + "sensitivity": 2.1505106287123117 + }, + { + "name": "model.layers.35.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00016956492618191987, + "sensitivity": 0.9010917258888543 + }, + { + "name": "model.layers.35.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.604637691343669e-05, + "sensitivity": 1.6096531391260205 + }, + { + "name": "model.layers.35.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 4.943474050378427e-05, + "sensitivity": 0.7476913648792373 + }, + { + "name": "model.layers.35.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00029013227322138846, + "sensitivity": 0.7264488893333413 + }, + { + "name": "model.layers.36.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.668676385539584e-05, + "sensitivity": 0.9640336223432616 + }, + { + "name": "model.layers.36.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3135334029357182e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.690589750884101e-05, + "sensitivity": 0.7129996317690679 + }, + { + "name": "model.layers.36.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.962895738775842e-05, + "sensitivity": 0.8959729241275801 + }, + { + "name": "model.layers.36.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1550600902410224e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006544087082147598, + "sensitivity": 0.5465737048542805 + }, + { + "name": "model.layers.36.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006941991741769016, + "sensitivity": 0.5618890343884857 + }, + { + "name": "model.layers.36.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.016852593238582e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007054070010781288, + "sensitivity": 0.5440575995655275 + }, + { + "name": "model.layers.36.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.849979061167687e-05, + "sensitivity": 0.6721901546598549 + }, + { + "name": "model.layers.36.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.203219881062978e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006776090594939888, + "sensitivity": 0.564015622377662 + }, + { + "name": "model.layers.36.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8748228184413165e-05, + "sensitivity": 1.0874910130291084 + }, + { + "name": "model.layers.36.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.7718875824357383e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006823347648605704, + "sensitivity": 0.544625672887157 + }, + { + "name": "model.layers.36.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.026951450621709e-05, + "sensitivity": 0.8288769534324171 + }, + { + "name": "model.layers.36.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.351092676799453e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006891156081110239, + "sensitivity": 0.5348018241494691 + }, + { + "name": "model.layers.36.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7759840274229646e-05, + "sensitivity": 0.9884530292175214 + }, + { + "name": "model.layers.36.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.165736193797784e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006851445650681853, + "sensitivity": 0.5253703778888019 + }, + { + "name": "model.layers.36.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0736946933320723e-05, + "sensitivity": 1.329990892548208 + }, + { + "name": "model.layers.36.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.962535634447704e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0854043113067746e-05, + "sensitivity": 0.7292771622348906 + }, + { + "name": "model.layers.36.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.918125680182129e-05, + "sensitivity": 0.6897980767829062 + }, + { + "name": "model.layers.36.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.246757031178277e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006582018686458468, + "sensitivity": 0.546522356038087 + }, + { + "name": "model.layers.36.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.670665268553421e-05, + "sensitivity": 0.9675545780015022 + }, + { + "name": "model.layers.36.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2413274816935882e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006358489627018571, + "sensitivity": 0.5848587078668935 + }, + { + "name": "model.layers.36.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0209178071818314e-05, + "sensitivity": 1.238094149590065 + }, + { + "name": "model.layers.36.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1642566732916748e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000635845004580915, + "sensitivity": 0.5495772422687493 + }, + { + "name": "model.layers.36.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.959994450677186e-05, + "sensitivity": 0.715650550204975 + }, + { + "name": "model.layers.36.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.02360388609668e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00067283830139786, + "sensitivity": 0.5289990068362125 + }, + { + "name": "model.layers.36.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3157599571277387e-06, + "sensitivity": 2.0977221956395917 + }, + { + "name": "model.layers.36.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.58927423399291e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.119477620813996e-05, + "sensitivity": 0.6975604884095079 + }, + { + "name": "model.layers.36.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.425456841592677e-06, + "sensitivity": 2.098046124713189 + }, + { + "name": "model.layers.36.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.518637304798176e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.202734948601574e-05, + "sensitivity": 1.0308489715978004 + }, + { + "name": "model.layers.36.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.852523463545367e-05, + "sensitivity": 0.6419502694478354 + }, + { + "name": "model.layers.36.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.341172719548922e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.827449422213249e-05, + "sensitivity": 0.6040139246663586 + }, + { + "name": "model.layers.36.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.639532901113853e-05, + "sensitivity": 0.8996637134516249 + }, + { + "name": "model.layers.36.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.865009254397592e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000627523404546082, + "sensitivity": 0.5349962787419901 + }, + { + "name": "model.layers.36.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.475596455857158e-05, + "sensitivity": 0.9650248734060936 + }, + { + "name": "model.layers.36.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0230453426629538e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000726040918380022, + "sensitivity": 0.553827823526564 + }, + { + "name": "model.layers.36.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.831756425322965e-05, + "sensitivity": 0.821269856299335 + }, + { + "name": "model.layers.36.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.615073738837964e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006716576172038913, + "sensitivity": 0.5575229932450995 + }, + { + "name": "model.layers.36.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0641556046903133e-05, + "sensitivity": 0.7426177871863742 + }, + { + "name": "model.layers.36.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0089460147355567e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.070926247048192e-05, + "sensitivity": 0.607932400049435 + }, + { + "name": "model.layers.36.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.181591743370518e-05, + "sensitivity": 0.6420813982500548 + }, + { + "name": "model.layers.36.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.0139344643394e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006894014659337699, + "sensitivity": 0.5490337195876179 + }, + { + "name": "model.layers.36.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0088554164394736e-05, + "sensitivity": 0.6568147679207645 + }, + { + "name": "model.layers.36.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.732601605108357e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.029329597367905e-05, + "sensitivity": 0.6667319890844 + }, + { + "name": "model.layers.36.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9565492847468704e-05, + "sensitivity": 0.8450725999895237 + }, + { + "name": "model.layers.36.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0169870847676066e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006585392984561622, + "sensitivity": 0.5177990920734435 + }, + { + "name": "model.layers.36.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.181406206451356e-05, + "sensitivity": 0.8731819401306434 + }, + { + "name": "model.layers.36.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.963933737504703e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007003047503530979, + "sensitivity": 0.5343592213490982 + }, + { + "name": "model.layers.36.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0459551958774682e-05, + "sensitivity": 1.5242070768531772 + }, + { + "name": "model.layers.36.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.995243211349589e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00061449920758605, + "sensitivity": 0.5245936523537305 + }, + { + "name": "model.layers.36.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.13287920714356e-05, + "sensitivity": 1.0279960410641238 + }, + { + "name": "model.layers.36.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.655916078874725e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006759327370673418, + "sensitivity": 0.5324166055247583 + }, + { + "name": "model.layers.36.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.54269169899635e-05, + "sensitivity": 1.0468958389347323 + }, + { + "name": "model.layers.36.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.017398517433321e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.700131052639335e-05, + "sensitivity": 0.6666338358701549 + }, + { + "name": "model.layers.36.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.908314389875159e-05, + "sensitivity": 0.7435513493970665 + }, + { + "name": "model.layers.36.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0590541705823853e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008159849676303566, + "sensitivity": 0.539085835417511 + }, + { + "name": "model.layers.36.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.720780973206274e-05, + "sensitivity": 1.0398102006294323 + }, + { + "name": "model.layers.36.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.132068731152685e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000634964439086616, + "sensitivity": 0.5351771075419581 + }, + { + "name": "model.layers.36.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000734447268769145, + "sensitivity": 0.5902420603966676 + }, + { + "name": "model.layers.36.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0472106168890605e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007385943899862468, + "sensitivity": 0.528432508377599 + }, + { + "name": "model.layers.36.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.369512993842363e-05, + "sensitivity": 0.626051071577809 + }, + { + "name": "model.layers.36.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.513865855595213e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006978057208471, + "sensitivity": 0.5704271474252549 + }, + { + "name": "model.layers.36.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.803361535887234e-06, + "sensitivity": 1.810844067356358 + }, + { + "name": "model.layers.36.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.111821555052302e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.2466290071606636e-05, + "sensitivity": 0.7193675559089636 + }, + { + "name": "model.layers.36.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.411189679056406e-05, + "sensitivity": 1.1392373513882688 + }, + { + "name": "model.layers.36.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.5912794272881e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007239388069137931, + "sensitivity": 0.5337674047045035 + }, + { + "name": "model.layers.36.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0678957551135682e-05, + "sensitivity": 1.3845916073080906 + }, + { + "name": "model.layers.36.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5112116216187133e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.807169509353116e-05, + "sensitivity": 0.7384261230559778 + }, + { + "name": "model.layers.36.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.096934885135852e-05, + "sensitivity": 1.0661468892079558 + }, + { + "name": "model.layers.36.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.601612873666454e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006818177062086761, + "sensitivity": 0.5427217163177741 + }, + { + "name": "model.layers.36.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0651125194272026e-05, + "sensitivity": 1.4551886075307705 + }, + { + "name": "model.layers.36.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.071320050679788e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006480823503807187, + "sensitivity": 0.5387879346049439 + }, + { + "name": "model.layers.36.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.775857425760478e-05, + "sensitivity": 0.7334879943850212 + }, + { + "name": "model.layers.36.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.22509912015812e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006380357663147151, + "sensitivity": 0.5504078107132487 + }, + { + "name": "model.layers.36.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.683056588168256e-05, + "sensitivity": 0.7460235653442535 + }, + { + "name": "model.layers.36.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.55738733207545e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006753659690730274, + "sensitivity": 0.5410181399277114 + }, + { + "name": "model.layers.36.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.459267024183646e-05, + "sensitivity": 0.9157599125110993 + }, + { + "name": "model.layers.36.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1399504273867933e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.43450184725225e-05, + "sensitivity": 0.6242180440735996 + }, + { + "name": "model.layers.36.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.50553340872284e-05, + "sensitivity": 1.0206746389930885 + }, + { + "name": "model.layers.36.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.125227057258599e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.3447511163540184e-05, + "sensitivity": 0.6103149591029337 + }, + { + "name": "model.layers.36.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0206290072528645e-05, + "sensitivity": 0.811226410788321 + }, + { + "name": "model.layers.36.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2025005844407133e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000680436089169234, + "sensitivity": 0.5776488091202794 + }, + { + "name": "model.layers.36.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5866890761535615e-05, + "sensitivity": 0.7218844687080449 + }, + { + "name": "model.layers.36.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.696295369896688e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000628418056294322, + "sensitivity": 0.5626676524104116 + }, + { + "name": "model.layers.36.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.356934318318963e-05, + "sensitivity": 0.7412858081147318 + }, + { + "name": "model.layers.36.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.549958240815613e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007178589585237205, + "sensitivity": 0.5294890766676 + }, + { + "name": "model.layers.36.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.221088859892916e-05, + "sensitivity": 1.2375017165583162 + }, + { + "name": "model.layers.36.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.71440988703398e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.570393063360825e-05, + "sensitivity": 0.6789214208743111 + }, + { + "name": "model.layers.36.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.945716839050874e-05, + "sensitivity": 1.1024347223527429 + }, + { + "name": "model.layers.36.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4030504189577186e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000662908423691988, + "sensitivity": 0.5536401622840835 + }, + { + "name": "model.layers.36.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.374837094976101e-06, + "sensitivity": 2.0972730538820117 + }, + { + "name": "model.layers.36.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.471066277910722e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006757731316611171, + "sensitivity": 0.522009612229682 + }, + { + "name": "model.layers.36.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4934679458965547e-06, + "sensitivity": 2.098493137667436 + }, + { + "name": "model.layers.36.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.3165548554970883e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.786112160421908e-05, + "sensitivity": 1.067276960746323 + }, + { + "name": "model.layers.36.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.23839077888988e-05, + "sensitivity": 0.9489770706543199 + }, + { + "name": "model.layers.36.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0761461908259662e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006839242996647954, + "sensitivity": 0.5227470200263583 + }, + { + "name": "model.layers.36.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.492462125606835e-05, + "sensitivity": 0.7503371383309553 + }, + { + "name": "model.layers.36.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.84104417511844e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007500160718336701, + "sensitivity": 0.549507135386226 + }, + { + "name": "model.layers.36.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.710976984119043e-05, + "sensitivity": 1.0560574061590093 + }, + { + "name": "model.layers.36.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.499116231381777e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9287453041179106e-05, + "sensitivity": 0.7072378614230035 + }, + { + "name": "model.layers.36.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.125147774582729e-05, + "sensitivity": 1.0084038640783672 + }, + { + "name": "model.layers.36.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.283530862878251e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006767324521206319, + "sensitivity": 0.5314523208526389 + }, + { + "name": "model.layers.36.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1257325240876526e-05, + "sensitivity": 1.4118462914245062 + }, + { + "name": "model.layers.36.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.0129555196035653e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.947204044787213e-05, + "sensitivity": 0.6886529744873622 + }, + { + "name": "model.layers.36.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006696636555716395, + "sensitivity": 0.5494978121908493 + }, + { + "name": "model.layers.36.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.125281283355434e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006698934594169259, + "sensitivity": 0.5287469887521085 + }, + { + "name": "model.layers.36.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.618872430408373e-05, + "sensitivity": 0.6343835776202407 + }, + { + "name": "model.layers.36.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.09311438590521e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007409563986584544, + "sensitivity": 0.5355365947366015 + }, + { + "name": "model.layers.36.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0988539543177467e-05, + "sensitivity": 1.3624498787018338 + }, + { + "name": "model.layers.36.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.250993571185973e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006748826126568019, + "sensitivity": 0.5709995572723836 + }, + { + "name": "model.layers.36.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0569000197574496e-05, + "sensitivity": 0.8508277163514519 + }, + { + "name": "model.layers.36.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0993385330948513e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006830545607954264, + "sensitivity": 0.5903178761733927 + }, + { + "name": "model.layers.36.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0384026609244756e-05, + "sensitivity": 1.5259491511843795 + }, + { + "name": "model.layers.36.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5623470517311944e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.532040086109191e-05, + "sensitivity": 0.8592470903008779 + }, + { + "name": "model.layers.36.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.882831464987248e-05, + "sensitivity": 0.6484972197899835 + }, + { + "name": "model.layers.36.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.028889849105326e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006585276569239795, + "sensitivity": 0.5733988919231214 + }, + { + "name": "model.layers.36.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.064047228283016e-05, + "sensitivity": 1.365259427216087 + }, + { + "name": "model.layers.36.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1592276223382214e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000634188880212605, + "sensitivity": 0.5953594298887261 + }, + { + "name": "model.layers.36.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0877275245729834e-05, + "sensitivity": 0.6177985793417997 + }, + { + "name": "model.layers.36.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.299274216165941e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006708285072818398, + "sensitivity": 0.5507102626573779 + }, + { + "name": "model.layers.36.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2071599485352635e-05, + "sensitivity": 1.3048750746124196 + }, + { + "name": "model.layers.36.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.107966434385162e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007701545837335289, + "sensitivity": 0.5619328214493994 + }, + { + "name": "model.layers.36.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006736309151165187, + "sensitivity": 0.5324677635138738 + }, + { + "name": "model.layers.36.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.850726776974625e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006757138180546463, + "sensitivity": 0.5409467330757185 + }, + { + "name": "model.layers.36.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.189431587699801e-05, + "sensitivity": 0.6587449613320135 + }, + { + "name": "model.layers.36.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.022585820464883e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.212417792994529e-05, + "sensitivity": 0.6263193559924018 + }, + { + "name": "model.layers.36.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.482443505869014e-06, + "sensitivity": 2.097130491516435 + }, + { + "name": "model.layers.36.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.619687943995814e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.59232828184031e-05, + "sensitivity": 0.6256681584751344 + }, + { + "name": "model.layers.36.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.188780389493331e-05, + "sensitivity": 1.086995745504538 + }, + { + "name": "model.layers.36.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.80552852575056e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.165164813864976e-05, + "sensitivity": 0.632624958399351 + }, + { + "name": "model.layers.36.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 2.135871454811422e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4085597942757886e-06, + "sensitivity": 2.1033973578890737 + }, + { + "name": "model.layers.36.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.9327427455427824e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.36.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.6801866422611056e-06, + "sensitivity": 2.1046438990440186 + }, + { + "name": "model.layers.36.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 7.549389010819141e-06, + "sensitivity": 2.1944605072919825 + }, + { + "name": "model.layers.36.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00019526755204424262, + "sensitivity": 1.1307676719923343 + }, + { + "name": "model.layers.36.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.7418473362340592e-05, + "sensitivity": 1.452552042528164 + }, + { + "name": "model.layers.36.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.0748029025271535e-05, + "sensitivity": 0.7665377373187339 + }, + { + "name": "model.layers.36.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003096478758379817, + "sensitivity": 0.8873160293952393 + }, + { + "name": "model.layers.37.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.302124812558759e-06, + "sensitivity": 2.097452335337531 + }, + { + "name": "model.layers.37.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.12417433228984e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.896820221096277e-05, + "sensitivity": 0.7921372023782499 + }, + { + "name": "model.layers.37.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.389175541698933e-05, + "sensitivity": 0.7219127596064867 + }, + { + "name": "model.layers.37.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.35949344693654e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000741355586796999, + "sensitivity": 0.5568070985848861 + }, + { + "name": "model.layers.37.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.5106193030951545e-05, + "sensitivity": 0.6633723418220443 + }, + { + "name": "model.layers.37.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.204024884937098e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006339214160107076, + "sensitivity": 0.516335529400299 + }, + { + "name": "model.layers.37.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7829216530080885e-05, + "sensitivity": 0.7582129297948588 + }, + { + "name": "model.layers.37.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.567717830170295e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006413698429241776, + "sensitivity": 0.5507321083913294 + }, + { + "name": "model.layers.37.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1128735422971658e-05, + "sensitivity": 1.3700616603755014 + }, + { + "name": "model.layers.37.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.747691365191713e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006818644469603896, + "sensitivity": 0.5721479142177051 + }, + { + "name": "model.layers.37.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6381861213594675e-05, + "sensitivity": 0.9598977763178773 + }, + { + "name": "model.layers.37.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.754584198162775e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006472060922533274, + "sensitivity": 0.563560743996091 + }, + { + "name": "model.layers.37.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.802956729894504e-05, + "sensitivity": 1.0552206108301607 + }, + { + "name": "model.layers.37.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.484796131189796e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00063495640642941, + "sensitivity": 0.5410345943772726 + }, + { + "name": "model.layers.37.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7586126786191016e-05, + "sensitivity": 0.8605155551875342 + }, + { + "name": "model.layers.37.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.273434216083842e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.792734009446576e-05, + "sensitivity": 0.6996222121259377 + }, + { + "name": "model.layers.37.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2730108210234903e-05, + "sensitivity": 1.264005302479709 + }, + { + "name": "model.layers.37.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.041020141201443e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.654509681742638e-05, + "sensitivity": 0.6666476808593517 + }, + { + "name": "model.layers.37.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.025940820109099e-05, + "sensitivity": 0.8626932921153915 + }, + { + "name": "model.layers.37.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6035735370678594e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000711114495061338, + "sensitivity": 0.5661815076716703 + }, + { + "name": "model.layers.37.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3642824089620262e-06, + "sensitivity": 2.0969615171880633 + }, + { + "name": "model.layers.37.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.295581455451611e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006611902499571443, + "sensitivity": 0.556768246469093 + }, + { + "name": "model.layers.37.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.765238165622577e-05, + "sensitivity": 0.6246352613889069 + }, + { + "name": "model.layers.37.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.054606498968496e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006551609258167446, + "sensitivity": 0.5439375638551006 + }, + { + "name": "model.layers.37.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.094669151934795e-05, + "sensitivity": 0.711999524484687 + }, + { + "name": "model.layers.37.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.837141993149999e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006958224694244564, + "sensitivity": 0.5570416800500859 + }, + { + "name": "model.layers.37.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0699570894939825e-05, + "sensitivity": 0.6824221586210265 + }, + { + "name": "model.layers.37.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.990987225843128e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006769397296011448, + "sensitivity": 0.5212081206000486 + }, + { + "name": "model.layers.37.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.514830602100119e-05, + "sensitivity": 0.6681365923450557 + }, + { + "name": "model.layers.37.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.239202091113839e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000745285942684859, + "sensitivity": 0.5445901282577901 + }, + { + "name": "model.layers.37.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.27272334996087e-06, + "sensitivity": 2.097196701441726 + }, + { + "name": "model.layers.37.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.004353730939329e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.562891601584852e-05, + "sensitivity": 0.6393174769851493 + }, + { + "name": "model.layers.37.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.53853639960289e-05, + "sensitivity": 0.7655649439565182 + }, + { + "name": "model.layers.37.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.460768524149898e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007522036321461201, + "sensitivity": 0.5305305803390639 + }, + { + "name": "model.layers.37.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1116399946331512e-05, + "sensitivity": 1.6397068868878408 + }, + { + "name": "model.layers.37.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.749327318786527e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006732783513143659, + "sensitivity": 0.5478337486025588 + }, + { + "name": "model.layers.37.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4753678644628963e-06, + "sensitivity": 2.0711763870655178 + }, + { + "name": "model.layers.37.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0159860721614677e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000689714855980128, + "sensitivity": 0.5221909400195582 + }, + { + "name": "model.layers.37.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1366965736669954e-05, + "sensitivity": 1.9609869586206166 + }, + { + "name": "model.layers.37.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.865016995201586e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.302844849415123e-05, + "sensitivity": 0.6168575310847293 + }, + { + "name": "model.layers.37.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.230920553207397e-05, + "sensitivity": 0.8498473773808541 + }, + { + "name": "model.layers.37.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.943162927404046e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006923649925738573, + "sensitivity": 0.5405471095811589 + }, + { + "name": "model.layers.37.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006958985468372703, + "sensitivity": 0.5297506409746597 + }, + { + "name": "model.layers.37.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.649422061855148e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006998521275818348, + "sensitivity": 0.5191337801130173 + }, + { + "name": "model.layers.37.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.186944665387273e-05, + "sensitivity": 0.8519602185680781 + }, + { + "name": "model.layers.37.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.900416332835448e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000699941418133676, + "sensitivity": 0.5428862868439883 + }, + { + "name": "model.layers.37.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.083494680642616e-05, + "sensitivity": 1.5297040600860812 + }, + { + "name": "model.layers.37.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.491730116271356e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006959427846595645, + "sensitivity": 0.5354872487826088 + }, + { + "name": "model.layers.37.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.169309199322015e-05, + "sensitivity": 0.8503140097137301 + }, + { + "name": "model.layers.37.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.615719255227305e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006972586270421743, + "sensitivity": 0.5284244582940595 + }, + { + "name": "model.layers.37.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.093215360015165e-05, + "sensitivity": 1.2212163005156236 + }, + { + "name": "model.layers.37.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.656230991415214e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006491739768534899, + "sensitivity": 0.5325524421734972 + }, + { + "name": "model.layers.37.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.684213829226792e-05, + "sensitivity": 0.6572863949051713 + }, + { + "name": "model.layers.37.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.011159724839672e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006349403411149979, + "sensitivity": 0.5605172066252299 + }, + { + "name": "model.layers.37.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4441801542707253e-06, + "sensitivity": 2.0980290268640456 + }, + { + "name": "model.layers.37.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8294484789294074e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.306679279077798e-05, + "sensitivity": 0.7630241909422757 + }, + { + "name": "model.layers.37.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000683446298353374, + "sensitivity": 0.5718973273889251 + }, + { + "name": "model.layers.37.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.713724923836708e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006748434971086681, + "sensitivity": 0.5283168754136961 + }, + { + "name": "model.layers.37.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7480603572912514e-05, + "sensitivity": 1.0537997630210352 + }, + { + "name": "model.layers.37.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4402638726096484e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0575919633265585e-05, + "sensitivity": 0.7946288974825142 + }, + { + "name": "model.layers.37.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.810303264297545e-05, + "sensitivity": 0.6555779267110555 + }, + { + "name": "model.layers.37.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2314778814470628e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006537241279147565, + "sensitivity": 0.5862601638849012 + }, + { + "name": "model.layers.37.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.2508464907296e-05, + "sensitivity": 0.970509945816625 + }, + { + "name": "model.layers.37.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0489645774214296e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006891717202961445, + "sensitivity": 0.5156520844781036 + }, + { + "name": "model.layers.37.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.067997310310602e-05, + "sensitivity": 0.7992541945316728 + }, + { + "name": "model.layers.37.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4284368035077932e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006770477630198002, + "sensitivity": 0.5743152870027705 + }, + { + "name": "model.layers.37.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.245107215363532e-05, + "sensitivity": 0.719531326721042 + }, + { + "name": "model.layers.37.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0509995718166465e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.127853703219444e-05, + "sensitivity": 0.6477428766594358 + }, + { + "name": "model.layers.37.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0660706720955204e-05, + "sensitivity": 1.9710391840108836 + }, + { + "name": "model.layers.37.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0091016520163976e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006412186776287854, + "sensitivity": 0.5088055154310436 + }, + { + "name": "model.layers.37.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7212608226109296e-05, + "sensitivity": 0.9328043133181236 + }, + { + "name": "model.layers.37.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.776209258736344e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006299125961959362, + "sensitivity": 0.5842508073259671 + }, + { + "name": "model.layers.37.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1167439879500307e-05, + "sensitivity": 1.31137204304954 + }, + { + "name": "model.layers.37.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2373210438454407e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.055086851119995e-05, + "sensitivity": 0.6693938467451219 + }, + { + "name": "model.layers.37.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0220627347007394e-05, + "sensitivity": 0.8915977765906784 + }, + { + "name": "model.layers.37.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.45181625411351e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006736153736710548, + "sensitivity": 0.551629779007532 + }, + { + "name": "model.layers.37.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.16139150224626e-05, + "sensitivity": 0.6468572061501534 + }, + { + "name": "model.layers.37.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.244876769618713e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006723962724208832, + "sensitivity": 0.5142558823983778 + }, + { + "name": "model.layers.37.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.187464896356687e-05, + "sensitivity": 0.6911714096812139 + }, + { + "name": "model.layers.37.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.134232434196747e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006845792522653937, + "sensitivity": 0.5446161175166592 + }, + { + "name": "model.layers.37.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.022815068718046e-05, + "sensitivity": 0.9820657634935785 + }, + { + "name": "model.layers.37.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.935732699275832e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006805739249102771, + "sensitivity": 0.549917102827771 + }, + { + "name": "model.layers.37.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0943853339995258e-05, + "sensitivity": 1.7381985756819223 + }, + { + "name": "model.layers.37.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.934478733455762e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.943485302850604e-05, + "sensitivity": 0.6596687729967982 + }, + { + "name": "model.layers.37.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9473088185768574e-05, + "sensitivity": 0.8920275092829615 + }, + { + "name": "model.layers.37.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.065453241419164e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006441720761358738, + "sensitivity": 0.5462316276126933 + }, + { + "name": "model.layers.37.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9827056247740984e-05, + "sensitivity": 0.8005337985460637 + }, + { + "name": "model.layers.37.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.123493332983344e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006594903534278274, + "sensitivity": 0.5100425383967019 + }, + { + "name": "model.layers.37.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1518297469592653e-05, + "sensitivity": 1.3879762734429852 + }, + { + "name": "model.layers.37.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.732941753602063e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007081359508447349, + "sensitivity": 0.5644349857285658 + }, + { + "name": "model.layers.37.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.193906301632524e-05, + "sensitivity": 0.6873111121505817 + }, + { + "name": "model.layers.37.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.269386514963116e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006802353891544044, + "sensitivity": 0.5162391114177705 + }, + { + "name": "model.layers.37.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4623807955067605e-05, + "sensitivity": 0.9460798911165089 + }, + { + "name": "model.layers.37.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6311605577357113e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.3069088608026505e-05, + "sensitivity": 0.6393201690116905 + }, + { + "name": "model.layers.37.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1639006515906658e-05, + "sensitivity": 1.2235306861746142 + }, + { + "name": "model.layers.37.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4959522331992048e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.429952918551862e-05, + "sensitivity": 0.7281708606492134 + }, + { + "name": "model.layers.37.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9246347518637776e-05, + "sensitivity": 0.8100237819486493 + }, + { + "name": "model.layers.37.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.569563417244353e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006421346915885806, + "sensitivity": 0.5279682681546277 + }, + { + "name": "model.layers.37.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.164993828861043e-05, + "sensitivity": 0.825384085346361 + }, + { + "name": "model.layers.37.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0138396646652836e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006927895592525601, + "sensitivity": 0.5101231465199407 + }, + { + "name": "model.layers.37.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.750307900598273e-05, + "sensitivity": 0.7597483983713151 + }, + { + "name": "model.layers.37.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.132627501960087e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006501316092908382, + "sensitivity": 0.5273457405786252 + }, + { + "name": "model.layers.37.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.846087515237741e-05, + "sensitivity": 0.9236901214394716 + }, + { + "name": "model.layers.37.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4352447124110768e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006698904326185584, + "sensitivity": 0.5992858287529784 + }, + { + "name": "model.layers.37.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.901986489538103e-05, + "sensitivity": 0.7126783236756877 + }, + { + "name": "model.layers.37.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.907125786412507e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008026680443435907, + "sensitivity": 0.5459478657679557 + }, + { + "name": "model.layers.37.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.273431790759787e-05, + "sensitivity": 1.1847278515481288 + }, + { + "name": "model.layers.37.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.45285001105367e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007479221094399691, + "sensitivity": 0.5606961864213786 + }, + { + "name": "model.layers.37.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.1140674562047934e-06, + "sensitivity": 2.09707789146728 + }, + { + "name": "model.layers.37.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.714534942555474e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 4.982907194062136e-05, + "sensitivity": 0.6997687064355231 + }, + { + "name": "model.layers.37.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.584209768334404e-05, + "sensitivity": 0.7105042581769656 + }, + { + "name": "model.layers.37.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.899263891886221e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007648984901607037, + "sensitivity": 0.5424628158993285 + }, + { + "name": "model.layers.37.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.311644392553717e-05, + "sensitivity": 0.6009033639897583 + }, + { + "name": "model.layers.37.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.685067657803302e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006962268380448222, + "sensitivity": 0.5248251488921027 + }, + { + "name": "model.layers.37.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7643057516543195e-05, + "sensitivity": 0.9008569218404563 + }, + { + "name": "model.layers.37.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.308702715316031e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6666780437808484e-05, + "sensitivity": 0.7839186093973789 + }, + { + "name": "model.layers.37.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.890681495657191e-05, + "sensitivity": 0.6941545844308298 + }, + { + "name": "model.layers.37.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.716875529695244e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006469757645390928, + "sensitivity": 0.5265873871565041 + }, + { + "name": "model.layers.37.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.2412100406654645e-06, + "sensitivity": 2.097489371874163 + }, + { + "name": "model.layers.37.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0800115433085011e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.3102463425602764e-05, + "sensitivity": 1.0752350784577989 + }, + { + "name": "model.layers.37.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9430945839267224e-05, + "sensitivity": 0.6240700466467385 + }, + { + "name": "model.layers.37.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.036154213186819e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006674231262877584, + "sensitivity": 0.5516167955671343 + }, + { + "name": "model.layers.37.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0733531427104026e-05, + "sensitivity": 0.6602722870435423 + }, + { + "name": "model.layers.37.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.240046215883922e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006778130773454905, + "sensitivity": 0.5151939220837308 + }, + { + "name": "model.layers.37.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.960347698419355e-05, + "sensitivity": 0.9600211299643083 + }, + { + "name": "model.layers.37.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.108719953270338e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006849092314951122, + "sensitivity": 0.5286221778623037 + }, + { + "name": "model.layers.37.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.893439083592966e-05, + "sensitivity": 0.6586392020387694 + }, + { + "name": "model.layers.37.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.780119742368697e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006442448357120156, + "sensitivity": 0.5424659202123847 + }, + { + "name": "model.layers.37.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 2.0319412215030752e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.5518475013086572e-06, + "sensitivity": 2.1031899015091904 + }, + { + "name": "model.layers.37.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 3.1521030905423686e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.37.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.59159299073508e-06, + "sensitivity": 2.1044061654883115 + }, + { + "name": "model.layers.37.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 7.091897714417428e-06, + "sensitivity": 2.2035368899941923 + }, + { + "name": "model.layers.37.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00019590994634199888, + "sensitivity": 0.9431856680704118 + }, + { + "name": "model.layers.37.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.425206119165523e-05, + "sensitivity": 1.3999416397039393 + }, + { + "name": "model.layers.37.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0006590730044990778, + "sensitivity": 0.5898597784443735 + }, + { + "name": "model.layers.37.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003035494592040777, + "sensitivity": 0.7966544857602197 + }, + { + "name": "model.layers.38.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0736963304225355e-05, + "sensitivity": 1.4450468119761855 + }, + { + "name": "model.layers.38.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1331335372233298e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.870965833310038e-05, + "sensitivity": 0.6737918066876849 + }, + { + "name": "model.layers.38.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.063057662686333e-05, + "sensitivity": 0.8598348090894042 + }, + { + "name": "model.layers.38.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1859704045491526e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006938841543160379, + "sensitivity": 0.5472672600634879 + }, + { + "name": "model.layers.38.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4126607058860827e-06, + "sensitivity": 2.0972644224919708 + }, + { + "name": "model.layers.38.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.511306989727018e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007238363614305854, + "sensitivity": 0.5279065111537898 + }, + { + "name": "model.layers.38.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0728678363375366e-05, + "sensitivity": 0.7704957850408932 + }, + { + "name": "model.layers.38.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.331730552730733e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006947300862520933, + "sensitivity": 0.5429552792631855 + }, + { + "name": "model.layers.38.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.678594970959239e-05, + "sensitivity": 0.9333033528226451 + }, + { + "name": "model.layers.38.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1642458730420913e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.570552821154706e-05, + "sensitivity": 0.6333797279466585 + }, + { + "name": "model.layers.38.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1423270734667312e-05, + "sensitivity": 1.967436677731432 + }, + { + "name": "model.layers.38.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5442030871781753e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.082516483729705e-05, + "sensitivity": 0.8879931041445531 + }, + { + "name": "model.layers.38.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.811582013848238e-05, + "sensitivity": 0.7997905184011174 + }, + { + "name": "model.layers.38.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.061641321750358e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006506051868200302, + "sensitivity": 0.5800605825678663 + }, + { + "name": "model.layers.38.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.377868703566492e-05, + "sensitivity": 0.6536306710330402 + }, + { + "name": "model.layers.38.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.996768888711813e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007458789041265845, + "sensitivity": 0.552765640176303 + }, + { + "name": "model.layers.38.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0259142628638074e-05, + "sensitivity": 0.6884224931963461 + }, + { + "name": "model.layers.38.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.461678362436942e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000696134171448648, + "sensitivity": 0.5129081050464646 + }, + { + "name": "model.layers.38.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.561011832673103e-05, + "sensitivity": 0.6264457918862952 + }, + { + "name": "model.layers.38.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.929504815569089e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007240357808768749, + "sensitivity": 0.5412743854788815 + }, + { + "name": "model.layers.38.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006758588133379817, + "sensitivity": 0.5482703139385345 + }, + { + "name": "model.layers.38.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.677696546830703e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006702930550090969, + "sensitivity": 0.5298997387460779 + }, + { + "name": "model.layers.38.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0498922165425029e-05, + "sensitivity": 1.7208293134417527 + }, + { + "name": "model.layers.38.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.05564184247487e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006177224568091333, + "sensitivity": 0.5778145635366704 + }, + { + "name": "model.layers.38.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.383556319633499e-05, + "sensitivity": 0.650148350434733 + }, + { + "name": "model.layers.38.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.361405659547017e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007266210741363466, + "sensitivity": 0.5254834461359391 + }, + { + "name": "model.layers.38.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.280293746385723e-05, + "sensitivity": 0.804707161420599 + }, + { + "name": "model.layers.38.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.458293905277969e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006981625920161605, + "sensitivity": 0.5814683516531027 + }, + { + "name": "model.layers.38.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.380418926710263e-05, + "sensitivity": 0.6336346515343672 + }, + { + "name": "model.layers.38.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.381045179499779e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007400352042168379, + "sensitivity": 0.5457607789702074 + }, + { + "name": "model.layers.38.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.308348383754492e-05, + "sensitivity": 0.7895229864661133 + }, + { + "name": "model.layers.38.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.162410267686937e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006920917658135295, + "sensitivity": 0.5414423890813646 + }, + { + "name": "model.layers.38.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.17111218161881e-05, + "sensitivity": 0.9261949515672412 + }, + { + "name": "model.layers.38.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.448383030350669e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007183767738752067, + "sensitivity": 0.5116324217371451 + }, + { + "name": "model.layers.38.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.549419777002186e-05, + "sensitivity": 0.6446354045413943 + }, + { + "name": "model.layers.38.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.004338608065154e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007221675477921963, + "sensitivity": 0.5822686108475714 + }, + { + "name": "model.layers.38.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.869466986041516e-05, + "sensitivity": 0.8778600361072899 + }, + { + "name": "model.layers.38.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.868595043371897e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.166766252135858e-05, + "sensitivity": 0.6145040325997222 + }, + { + "name": "model.layers.38.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.915674410061911e-05, + "sensitivity": 0.6713044429138317 + }, + { + "name": "model.layers.38.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.456653972643835e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006673064781352878, + "sensitivity": 0.5240878536480446 + }, + { + "name": "model.layers.38.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.572407437488437e-05, + "sensitivity": 0.6222399476011043 + }, + { + "name": "model.layers.38.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.821663979892037e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007359473966062069, + "sensitivity": 0.5371415374473388 + }, + { + "name": "model.layers.38.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.703104397980496e-05, + "sensitivity": 1.085422717291598 + }, + { + "name": "model.layers.38.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.555099159617384e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006517720175907016, + "sensitivity": 0.5528293805016399 + }, + { + "name": "model.layers.38.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1577378245419823e-05, + "sensitivity": 1.7077207007975004 + }, + { + "name": "model.layers.38.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.164510856862762e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.203556404216215e-05, + "sensitivity": 0.7083354980680456 + }, + { + "name": "model.layers.38.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6880518968682736e-05, + "sensitivity": 0.9325231815145922 + }, + { + "name": "model.layers.38.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0176053137911367e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006210339488461614, + "sensitivity": 0.5453678415415362 + }, + { + "name": "model.layers.38.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.408622721210122e-05, + "sensitivity": 0.611026328930356 + }, + { + "name": "model.layers.38.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.731653113296488e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007151947356760502, + "sensitivity": 0.5175118594333733 + }, + { + "name": "model.layers.38.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.1031445511616766e-05, + "sensitivity": 0.8050350946567719 + }, + { + "name": "model.layers.38.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.510345080343541e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006841346621513367, + "sensitivity": 0.5633464371178575 + }, + { + "name": "model.layers.38.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.3143343393458053e-05, + "sensitivity": 0.7645179687406712 + }, + { + "name": "model.layers.38.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0193438129135757e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006647929549217224, + "sensitivity": 0.5967343195817375 + }, + { + "name": "model.layers.38.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.769041308667511e-05, + "sensitivity": 0.7927742273244132 + }, + { + "name": "model.layers.38.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.137312438004301e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9421050536911935e-05, + "sensitivity": 0.6526393083462011 + }, + { + "name": "model.layers.38.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7862838730216026e-05, + "sensitivity": 0.9473071246328705 + }, + { + "name": "model.layers.38.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.991072266122501e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.85821398999542e-05, + "sensitivity": 0.7826239638919337 + }, + { + "name": "model.layers.38.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.164536171127111e-05, + "sensitivity": 0.6105057223448729 + }, + { + "name": "model.layers.38.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.666500773164444e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006874680984765291, + "sensitivity": 0.5786716442131148 + }, + { + "name": "model.layers.38.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.196635513333604e-05, + "sensitivity": 0.7532722795094581 + }, + { + "name": "model.layers.38.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.961955811377265e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000682518701069057, + "sensitivity": 0.5714278202388292 + }, + { + "name": "model.layers.38.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.2158768186054658e-05, + "sensitivity": 1.5966347617693764 + }, + { + "name": "model.layers.38.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0647603403413086e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007416459266096354, + "sensitivity": 0.5235640456118038 + }, + { + "name": "model.layers.38.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006940662860870361, + "sensitivity": 0.5618557854353237 + }, + { + "name": "model.layers.38.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.60805436989176e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.192050932440907e-05, + "sensitivity": 0.8173388486005975 + }, + { + "name": "model.layers.38.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1720292604877613e-05, + "sensitivity": 1.7655637718487405 + }, + { + "name": "model.layers.38.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.750500117253978e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007173746707849205, + "sensitivity": 0.5435131589486102 + }, + { + "name": "model.layers.38.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.979033812764101e-05, + "sensitivity": 1.135255361274395 + }, + { + "name": "model.layers.38.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2596987062352127e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.2996417353861034e-05, + "sensitivity": 1.9063396529536423 + }, + { + "name": "model.layers.38.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.800568760605529e-05, + "sensitivity": 0.7146855740234075 + }, + { + "name": "model.layers.38.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0921083912762697e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0395701439119875e-05, + "sensitivity": 0.7230410049783462 + }, + { + "name": "model.layers.38.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.999011773383245e-05, + "sensitivity": 0.9924456461320095 + }, + { + "name": "model.layers.38.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.194724839289847e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.986793985357508e-05, + "sensitivity": 0.6898269190014378 + }, + { + "name": "model.layers.38.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006816412205807865, + "sensitivity": 0.5752718719741018 + }, + { + "name": "model.layers.38.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.284106343126041e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006688748835586011, + "sensitivity": 0.5305661507782721 + }, + { + "name": "model.layers.38.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.840432640979998e-05, + "sensitivity": 0.7908319874086872 + }, + { + "name": "model.layers.38.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.161337975958304e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006623369408771396, + "sensitivity": 0.5650900944018682 + }, + { + "name": "model.layers.38.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.522317223949358e-05, + "sensitivity": 0.874938698699304 + }, + { + "name": "model.layers.38.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.459506031817e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7271325204055756e-05, + "sensitivity": 0.6488818234880716 + }, + { + "name": "model.layers.38.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.22064180788584e-05, + "sensitivity": 0.6225092133515171 + }, + { + "name": "model.layers.38.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.114087353926152e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.233610474737361e-05, + "sensitivity": 0.6140325260718644 + }, + { + "name": "model.layers.38.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.801624840591103e-05, + "sensitivity": 0.8182234792255381 + }, + { + "name": "model.layers.38.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.894464258446533e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007674290100112557, + "sensitivity": 0.5995419781952531 + }, + { + "name": "model.layers.38.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.830479130963795e-05, + "sensitivity": 0.8101819674126365 + }, + { + "name": "model.layers.38.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.794924385962076e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006686918204650283, + "sensitivity": 0.5775589901206843 + }, + { + "name": "model.layers.38.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.046903945389204e-05, + "sensitivity": 0.6401360978656252 + }, + { + "name": "model.layers.38.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.115149855962954e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006707264110445976, + "sensitivity": 0.5470896253240305 + }, + { + "name": "model.layers.38.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1144637937832158e-05, + "sensitivity": 1.2138131898756135 + }, + { + "name": "model.layers.38.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.647925824334379e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006737086805514991, + "sensitivity": 0.5272079686142046 + }, + { + "name": "model.layers.38.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.897700692818034e-06, + "sensitivity": 1.8399447774431854 + }, + { + "name": "model.layers.38.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.195443473989144e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006632436998188496, + "sensitivity": 0.5220072817727663 + }, + { + "name": "model.layers.38.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.678798672510311e-05, + "sensitivity": 0.6682461626713371 + }, + { + "name": "model.layers.38.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2090803238606895e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007542503881268203, + "sensitivity": 0.5239839144945017 + }, + { + "name": "model.layers.38.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0863640101160854e-05, + "sensitivity": 0.7556599921199358 + }, + { + "name": "model.layers.38.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0096244977830793e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.927976962993853e-05, + "sensitivity": 0.6249112004967459 + }, + { + "name": "model.layers.38.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.176536408020183e-05, + "sensitivity": 0.814277874146613 + }, + { + "name": "model.layers.38.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1035315310437e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006802745047025383, + "sensitivity": 0.5551582407974782 + }, + { + "name": "model.layers.38.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.704093200620264e-05, + "sensitivity": 0.7778790875137334 + }, + { + "name": "model.layers.38.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.086074462364195e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006411084905266762, + "sensitivity": 0.5432472540871147 + }, + { + "name": "model.layers.38.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.818324279971421e-05, + "sensitivity": 0.7338413233696585 + }, + { + "name": "model.layers.38.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.402800636351458e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006578720058314502, + "sensitivity": 0.5269159813730493 + }, + { + "name": "model.layers.38.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.928318569203839e-05, + "sensitivity": 0.9053979458792205 + }, + { + "name": "model.layers.38.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.917759603515151e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.179577758302912e-05, + "sensitivity": 0.8914989525133694 + }, + { + "name": "model.layers.38.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.106749060563743e-05, + "sensitivity": 0.6627390462730558 + }, + { + "name": "model.layers.38.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.105386430339422e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006960115279071033, + "sensitivity": 0.5304644745238295 + }, + { + "name": "model.layers.38.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.87084102537483e-05, + "sensitivity": 0.6550178697787897 + }, + { + "name": "model.layers.38.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.397425628776546e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007630162872374058, + "sensitivity": 0.5459293869206491 + }, + { + "name": "model.layers.38.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1009549780283123e-05, + "sensitivity": 1.2550138297930702 + }, + { + "name": "model.layers.38.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8839950826077256e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.587643292732537e-05, + "sensitivity": 0.765763643119126 + }, + { + "name": "model.layers.38.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1342013749526814e-05, + "sensitivity": 1.2012000882374338 + }, + { + "name": "model.layers.38.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2528583965831785e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007030301494523883, + "sensitivity": 0.5622507603511799 + }, + { + "name": "model.layers.38.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1798299965448678e-05, + "sensitivity": 1.7084111376727675 + }, + { + "name": "model.layers.38.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6336357475665864e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007041497156023979, + "sensitivity": 0.5616675308516614 + }, + { + "name": "model.layers.38.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007002138299867511, + "sensitivity": 0.5290153853068132 + }, + { + "name": "model.layers.38.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.02783552242181e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007168317097239196, + "sensitivity": 0.5739676205701342 + }, + { + "name": "model.layers.38.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1702543815772515e-05, + "sensitivity": 1.3104003358901097 + }, + { + "name": "model.layers.38.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.548892083126702e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007107759593054652, + "sensitivity": 0.5229263627977203 + }, + { + "name": "model.layers.38.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007367608486674726, + "sensitivity": 0.5348070909796999 + }, + { + "name": "model.layers.38.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.888032544338785e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007247903267852962, + "sensitivity": 0.5585633946410412 + }, + { + "name": "model.layers.38.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.093040039762855e-05, + "sensitivity": 1.018133381045087 + }, + { + "name": "model.layers.38.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1163078852405306e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000812046870123595, + "sensitivity": 0.539915229174407 + }, + { + "name": "model.layers.38.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.454921059324988e-06, + "sensitivity": 2.0976757888695823 + }, + { + "name": "model.layers.38.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2335585779510438e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007022731006145477, + "sensitivity": 0.532231430008083 + }, + { + "name": "model.layers.38.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6060780480038375e-05, + "sensitivity": 1.0235226563667443 + }, + { + "name": "model.layers.38.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.194548968276649e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006166922394186258, + "sensitivity": 0.5507257267935605 + }, + { + "name": "model.layers.38.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0579109584796242e-05, + "sensitivity": 1.7146943020678687 + }, + { + "name": "model.layers.38.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.357883416465484e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006664595566689968, + "sensitivity": 0.5543239991414078 + }, + { + "name": "model.layers.38.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.9770945982600097e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.5424553768971236e-06, + "sensitivity": 2.103727085689983 + }, + { + "name": "model.layers.38.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 3.148520136164734e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.38.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.6506267002114328e-06, + "sensitivity": 2.1063539667222337 + }, + { + "name": "model.layers.38.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 3.493807162158191e-05, + "sensitivity": 1.9371376998954295 + }, + { + "name": "model.layers.38.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00022416333376895636, + "sensitivity": 0.8421219746571228 + }, + { + "name": "model.layers.38.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.6650426914566197e-05, + "sensitivity": 1.1718413829074892 + }, + { + "name": "model.layers.38.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 2, + "mse": 0.0006198073970153928, + "sensitivity": 0.5865038575004429 + }, + { + "name": "model.layers.38.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003171184507664293, + "sensitivity": 0.7989223125306852 + }, + { + "name": "model.layers.39.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.476622754940763e-05, + "sensitivity": 0.7100612746416621 + }, + { + "name": "model.layers.39.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.140794645645656e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.648127626045607e-05, + "sensitivity": 0.6524057645401786 + }, + { + "name": "model.layers.39.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0538372407609131e-05, + "sensitivity": 1.206694647969812 + }, + { + "name": "model.layers.39.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.662712278033723e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006327390437945724, + "sensitivity": 0.5244607854412868 + }, + { + "name": "model.layers.39.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.211384607013315e-05, + "sensitivity": 0.8091823695630146 + }, + { + "name": "model.layers.39.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.918660796553013e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006852350197732449, + "sensitivity": 0.5166797254341666 + }, + { + "name": "model.layers.39.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.262149716145359e-05, + "sensitivity": 0.6693471995226878 + }, + { + "name": "model.layers.39.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.623521464163787e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006473431130871177, + "sensitivity": 0.5398393426171926 + }, + { + "name": "model.layers.39.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0703110648319125e-05, + "sensitivity": 0.9533739002912123 + }, + { + "name": "model.layers.39.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.748055281808774e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000656831543892622, + "sensitivity": 0.5549131028197842 + }, + { + "name": "model.layers.39.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006682753446511924, + "sensitivity": 0.5912047287791475 + }, + { + "name": "model.layers.39.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.752957233402412e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006577134481631219, + "sensitivity": 0.5238076550286463 + }, + { + "name": "model.layers.39.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.932372732786462e-05, + "sensitivity": 0.7790726773759558 + }, + { + "name": "model.layers.39.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.812831649469445e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.734008300350979e-05, + "sensitivity": 0.6293440480377281 + }, + { + "name": "model.layers.39.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006904881447553635, + "sensitivity": 0.5432123620845792 + }, + { + "name": "model.layers.39.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.753922315918317e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006968089728616178, + "sensitivity": 0.5253282480979053 + }, + { + "name": "model.layers.39.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 2.1473522792803124e-05, + "sensitivity": 0.7930698346433771 + }, + { + "name": "model.layers.39.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.115224560839124e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.4389831449079793e-05, + "sensitivity": 1.3108654370863408 + }, + { + "name": "model.layers.39.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0520644536882173e-05, + "sensitivity": 1.3711253804553913 + }, + { + "name": "model.layers.39.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3528127738027251e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.73063844058197e-05, + "sensitivity": 0.6557413613889793 + }, + { + "name": "model.layers.39.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.127559026936069e-05, + "sensitivity": 0.643997713392706 + }, + { + "name": "model.layers.39.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.864417739256169e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000683668302372098, + "sensitivity": 0.5045415624879863 + }, + { + "name": "model.layers.39.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006644650129601359, + "sensitivity": 0.5573927013725228 + }, + { + "name": "model.layers.39.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.684145089115191e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006450671935454011, + "sensitivity": 0.5187871378924244 + }, + { + "name": "model.layers.39.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.973321822239086e-05, + "sensitivity": 0.704934521182819 + }, + { + "name": "model.layers.39.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.78963453740289e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006597192259505391, + "sensitivity": 0.5160457484352768 + }, + { + "name": "model.layers.39.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.079169543227181e-05, + "sensitivity": 0.8022650142507949 + }, + { + "name": "model.layers.39.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.042226570774801e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006857478874735534, + "sensitivity": 0.548207998958497 + }, + { + "name": "model.layers.39.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006955274729989469, + "sensitivity": 0.5680190199981747 + }, + { + "name": "model.layers.39.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.36810272630828e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006839379202574492, + "sensitivity": 0.5366654801834161 + }, + { + "name": "model.layers.39.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9485097153810784e-05, + "sensitivity": 1.0272079247369683 + }, + { + "name": "model.layers.39.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.161619007296395e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006585874943993986, + "sensitivity": 0.5656811778149674 + }, + { + "name": "model.layers.39.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.266870332183316e-05, + "sensitivity": 0.6142284635658392 + }, + { + "name": "model.layers.39.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0610835943225538e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006683479296043515, + "sensitivity": 0.5410522825960149 + }, + { + "name": "model.layers.39.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.70434785913676e-05, + "sensitivity": 0.9346192318594475 + }, + { + "name": "model.layers.39.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.60811303734954e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.851740934303962e-05, + "sensitivity": 0.6916749368442041 + }, + { + "name": "model.layers.39.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.289083103183657e-05, + "sensitivity": 0.6514957987878518 + }, + { + "name": "model.layers.39.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.290964276762679e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.432915688492358e-05, + "sensitivity": 0.6130050081736167 + }, + { + "name": "model.layers.39.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.242296512937173e-05, + "sensitivity": 0.7031621542359285 + }, + { + "name": "model.layers.39.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.678588301336276e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.378129910444841e-05, + "sensitivity": 0.7100494938585319 + }, + { + "name": "model.layers.39.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007381384493783116, + "sensitivity": 0.5774468796435133 + }, + { + "name": "model.layers.39.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.804241022313363e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007333490066230297, + "sensitivity": 0.5193006075985804 + }, + { + "name": "model.layers.39.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0435429430799559e-05, + "sensitivity": 1.3987483311705913 + }, + { + "name": "model.layers.39.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0323344667995116e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0577607655432075e-05, + "sensitivity": 0.8955970264849787 + }, + { + "name": "model.layers.39.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1491849363665096e-05, + "sensitivity": 1.665850294701982 + }, + { + "name": "model.layers.39.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 3.170221589243738e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006805482553318143, + "sensitivity": 0.5596758954636547 + }, + { + "name": "model.layers.39.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.986378245230298e-06, + "sensitivity": 1.8937587377268428 + }, + { + "name": "model.layers.39.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3215703802416101e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.086035162094049e-05, + "sensitivity": 0.8345954554645236 + }, + { + "name": "model.layers.39.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0770621884148568e-05, + "sensitivity": 1.2814017965208755 + }, + { + "name": "model.layers.39.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.494630835935823e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006537455483339727, + "sensitivity": 0.5970699044888687 + }, + { + "name": "model.layers.39.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0423422837629914e-05, + "sensitivity": 0.6227683503793028 + }, + { + "name": "model.layers.39.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.98616383690387e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.198982009664178e-05, + "sensitivity": 0.6833482509933733 + }, + { + "name": "model.layers.39.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.023680907674134e-05, + "sensitivity": 0.8269617170411199 + }, + { + "name": "model.layers.39.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.481649385634228e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006717643700540066, + "sensitivity": 0.5137886567469321 + }, + { + "name": "model.layers.39.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006721188547089696, + "sensitivity": 0.5938252827967154 + }, + { + "name": "model.layers.39.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.990604444785276e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.04111046413891e-05, + "sensitivity": 0.6408955522232588 + }, + { + "name": "model.layers.39.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.7361356842448004e-06, + "sensitivity": 2.043403886084076 + }, + { + "name": "model.layers.39.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0014427971327677e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.925461639184505e-05, + "sensitivity": 0.6079326658229092 + }, + { + "name": "model.layers.39.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8652294683270156e-05, + "sensitivity": 1.1065439537262416 + }, + { + "name": "model.layers.39.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.393300620606169e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006562386406585574, + "sensitivity": 0.5639461269711041 + }, + { + "name": "model.layers.39.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007083863019943237, + "sensitivity": 0.5529114478539646 + }, + { + "name": "model.layers.39.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.899235813762061e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006930408999323845, + "sensitivity": 0.5616893920714676 + }, + { + "name": "model.layers.39.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.225090328371152e-05, + "sensitivity": 0.8113280813529479 + }, + { + "name": "model.layers.39.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.470771379303187e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.253809260670096e-05, + "sensitivity": 0.7712066241099206 + }, + { + "name": "model.layers.39.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1600927791732829e-05, + "sensitivity": 1.2516683917041294 + }, + { + "name": "model.layers.39.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.959716074561584e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006799572147428989, + "sensitivity": 0.5438361846779335 + }, + { + "name": "model.layers.39.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0600250789138954e-05, + "sensitivity": 1.3243370687592704 + }, + { + "name": "model.layers.39.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.345240303242463e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.119362999219447e-05, + "sensitivity": 0.6046896564761632 + }, + { + "name": "model.layers.39.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.448876618174836e-05, + "sensitivity": 1.1911252153280665 + }, + { + "name": "model.layers.39.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.438641548811574e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.4672229452989995e-05, + "sensitivity": 0.6305648166994127 + }, + { + "name": "model.layers.39.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1219084626645781e-05, + "sensitivity": 1.2869700113300997 + }, + { + "name": "model.layers.39.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.919267540681176e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006720914389006793, + "sensitivity": 0.5513354820635449 + }, + { + "name": "model.layers.39.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.655768083874136e-05, + "sensitivity": 0.9031072482191946 + }, + { + "name": "model.layers.39.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.071352244252921e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007671565981581807, + "sensitivity": 0.5139005623911344 + }, + { + "name": "model.layers.39.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.505981243913993e-05, + "sensitivity": 0.7783680316009035 + }, + { + "name": "model.layers.39.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0032263162429444e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005943889264017344, + "sensitivity": 0.562977440384917 + }, + { + "name": "model.layers.39.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9551093727350235e-05, + "sensitivity": 1.1519919714173843 + }, + { + "name": "model.layers.39.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2763093764078803e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.389725604094565e-05, + "sensitivity": 0.6269457640661141 + }, + { + "name": "model.layers.39.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0118163673905656e-05, + "sensitivity": 0.8780587219607586 + }, + { + "name": "model.layers.39.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.164872156157799e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006721747922711074, + "sensitivity": 0.5327180638557969 + }, + { + "name": "model.layers.39.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1105941666755825e-05, + "sensitivity": 1.212706536766602 + }, + { + "name": "model.layers.39.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.915624908288009e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006826884346082807, + "sensitivity": 0.5174000358002846 + }, + { + "name": "model.layers.39.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.184406083775684e-05, + "sensitivity": 0.7013552858728911 + }, + { + "name": "model.layers.39.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.733765414741356e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006869544158689678, + "sensitivity": 0.5375295132409327 + }, + { + "name": "model.layers.39.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.2240674297790974e-06, + "sensitivity": 2.0973038619525926 + }, + { + "name": "model.layers.39.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.98394511952938e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006719360826537013, + "sensitivity": 0.551211231169531 + }, + { + "name": "model.layers.39.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.625151581829414e-05, + "sensitivity": 0.7921709592767918 + }, + { + "name": "model.layers.39.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.837179734655365e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007439572364091873, + "sensitivity": 0.5961308960590006 + }, + { + "name": "model.layers.39.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.727499956265092e-05, + "sensitivity": 0.8725677666147085 + }, + { + "name": "model.layers.39.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.990274065785343e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006342043052427471, + "sensitivity": 0.5294861475378808 + }, + { + "name": "model.layers.39.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1400926268834155e-05, + "sensitivity": 1.382493598680396 + }, + { + "name": "model.layers.39.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.372045400989009e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.053807373973541e-05, + "sensitivity": 0.7337771771169108 + }, + { + "name": "model.layers.39.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7774515880737454e-05, + "sensitivity": 0.7815003394631265 + }, + { + "name": "model.layers.39.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1994748092547525e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006434351671487093, + "sensitivity": 0.5981944598392975 + }, + { + "name": "model.layers.39.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.646948920912109e-05, + "sensitivity": 0.7369908125173755 + }, + { + "name": "model.layers.39.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.640923851999105e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006283233524300158, + "sensitivity": 0.545940575552214 + }, + { + "name": "model.layers.39.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.0981829038646538e-06, + "sensitivity": 2.0970718765438763 + }, + { + "name": "model.layers.39.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.951515274522535e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7861427194438875e-05, + "sensitivity": 0.6026762774925586 + }, + { + "name": "model.layers.39.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.921417323406786e-05, + "sensitivity": 0.8378957999059257 + }, + { + "name": "model.layers.39.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.193703138204e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006554603460244834, + "sensitivity": 0.49314366421501654 + }, + { + "name": "model.layers.39.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0786752682179213e-05, + "sensitivity": 1.2452967157671249 + }, + { + "name": "model.layers.39.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0107200978382025e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.075889541534707e-05, + "sensitivity": 0.6320838294192164 + }, + { + "name": "model.layers.39.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.062581087462604e-05, + "sensitivity": 1.0911652309922621 + }, + { + "name": "model.layers.39.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.476967536807933e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006886426126584411, + "sensitivity": 0.5446675780007126 + }, + { + "name": "model.layers.39.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.724030779674649e-05, + "sensitivity": 0.8387992189104132 + }, + { + "name": "model.layers.39.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.817422667561914e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006621055072173476, + "sensitivity": 0.5145803498293915 + }, + { + "name": "model.layers.39.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.234316970221698e-05, + "sensitivity": 0.8433676454876173 + }, + { + "name": "model.layers.39.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.504972487964551e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.500181916635484e-05, + "sensitivity": 0.6013117411086724 + }, + { + "name": "model.layers.39.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.874373502796516e-05, + "sensitivity": 0.6904920428135264 + }, + { + "name": "model.layers.39.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0303363069397165e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007854144787415862, + "sensitivity": 0.5303263720866759 + }, + { + "name": "model.layers.39.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006808532634750009, + "sensitivity": 0.5321442712418644 + }, + { + "name": "model.layers.39.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.530355787821463e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.983895971439779e-05, + "sensitivity": 0.6002345346811967 + }, + { + "name": "model.layers.39.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1299083780613728e-05, + "sensitivity": 1.2197915405592077 + }, + { + "name": "model.layers.39.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.7910409724208876e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006881991284899414, + "sensitivity": 0.5951311648450504 + }, + { + "name": "model.layers.39.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007021564524620771, + "sensitivity": 0.5895181583567696 + }, + { + "name": "model.layers.39.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.887436138138582e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007092795567587018, + "sensitivity": 0.5452753474011182 + }, + { + "name": "model.layers.39.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.066477362764999e-05, + "sensitivity": 0.6501283636861791 + }, + { + "name": "model.layers.39.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.930823014452471e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006670200964435935, + "sensitivity": 0.5631563706580901 + }, + { + "name": "model.layers.39.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1048219676013105e-05, + "sensitivity": 1.2079174434314417 + }, + { + "name": "model.layers.39.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.335081022574741e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007050953572615981, + "sensitivity": 0.5784771445204531 + }, + { + "name": "model.layers.39.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006752251647412777, + "sensitivity": 0.5125080509255288 + }, + { + "name": "model.layers.39.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.54157588542148e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000665098603349179, + "sensitivity": 0.5064372522714233 + }, + { + "name": "model.layers.39.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 9.60523266257951e-06, + "sensitivity": 1.8719539008965573 + }, + { + "name": "model.layers.39.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.970683100211318e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0005875746719539165, + "sensitivity": 0.5260312906544403 + }, + { + "name": "model.layers.39.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.758394763688557e-05, + "sensitivity": 0.7770837608394059 + }, + { + "name": "model.layers.39.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.413449682440842e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006510838866233826, + "sensitivity": 0.5287501355776854 + }, + { + "name": "model.layers.39.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.15068493061699e-05, + "sensitivity": 0.6042068954172409 + }, + { + "name": "model.layers.39.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1690462997648865e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006654210155829787, + "sensitivity": 0.5854190036145648 + }, + { + "name": "model.layers.39.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.8469082760930178e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.5433862447243882e-06, + "sensitivity": 2.1043377456269607 + }, + { + "name": "model.layers.39.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 3.165350335621042e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.39.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.5586573454129393e-06, + "sensitivity": 2.1054101712091966 + }, + { + "name": "model.layers.39.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 4, + "mse": 3.6057423130841926e-05, + "sensitivity": 1.8086148419977652 + }, + { + "name": "model.layers.39.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.000211276113986969, + "sensitivity": 0.8069112452484706 + }, + { + "name": "model.layers.39.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.752154275891371e-05, + "sensitivity": 1.264455218254882 + }, + { + "name": "model.layers.39.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 4.6707205910934135e-05, + "sensitivity": 0.6667339867498504 + }, + { + "name": "model.layers.39.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0003304955898784101, + "sensitivity": 0.8798343819188216 + }, + { + "name": "model.layers.40.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8121087931795046e-05, + "sensitivity": 0.8178516364461677 + }, + { + "name": "model.layers.40.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.341753527929541e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.962352952337824e-05, + "sensitivity": 0.6812436505778894 + }, + { + "name": "model.layers.40.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.405886233551428e-05, + "sensitivity": 0.8736066557977898 + }, + { + "name": "model.layers.40.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.959762792277616e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007012709975242615, + "sensitivity": 0.5481768485665837 + }, + { + "name": "model.layers.40.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.817396959173493e-05, + "sensitivity": 0.9177336908885451 + }, + { + "name": "model.layers.40.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.395125175615249e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.199230847414583e-05, + "sensitivity": 0.7177849777709726 + }, + { + "name": "model.layers.40.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.5113322408287786e-06, + "sensitivity": 2.097809060723284 + }, + { + "name": "model.layers.40.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0233904959022766e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000708649109583348, + "sensitivity": 0.5353973386708811 + }, + { + "name": "model.layers.40.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007038149051368237, + "sensitivity": 0.5657141227728213 + }, + { + "name": "model.layers.40.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.672929657725035e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006967965746298432, + "sensitivity": 0.5287922694648037 + }, + { + "name": "model.layers.40.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7869834563462064e-05, + "sensitivity": 0.7075894401030691 + }, + { + "name": "model.layers.40.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.526347189923399e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006654573371633887, + "sensitivity": 0.527429576756727 + }, + { + "name": "model.layers.40.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.737847459386103e-05, + "sensitivity": 0.841907764806302 + }, + { + "name": "model.layers.40.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.213694400183158e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006513843545690179, + "sensitivity": 0.5163190298255367 + }, + { + "name": "model.layers.40.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.621115608140826e-05, + "sensitivity": 1.166857040449122 + }, + { + "name": "model.layers.40.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2210372233312228e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.809942715335637e-05, + "sensitivity": 0.6944964058575638 + }, + { + "name": "model.layers.40.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.19883940089494e-05, + "sensitivity": 0.6823616538286863 + }, + { + "name": "model.layers.40.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.335016789511428e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006859757704660296, + "sensitivity": 0.537409152042701 + }, + { + "name": "model.layers.40.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.066107744118199e-05, + "sensitivity": 1.1821976805641325 + }, + { + "name": "model.layers.40.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.797085572747164e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006700476515106857, + "sensitivity": 0.5874059759940562 + }, + { + "name": "model.layers.40.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.625667836284265e-05, + "sensitivity": 0.9408559566292883 + }, + { + "name": "model.layers.40.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.814019227225799e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006354874931275845, + "sensitivity": 0.5032430401995172 + }, + { + "name": "model.layers.40.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.743294605053961e-05, + "sensitivity": 1.052790293838426 + }, + { + "name": "model.layers.40.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0851209708562237e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000644017243757844, + "sensitivity": 0.5443894649166089 + }, + { + "name": "model.layers.40.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.42257509753108e-05, + "sensitivity": 0.873540188177285 + }, + { + "name": "model.layers.40.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.513713621345232e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00074167107231915, + "sensitivity": 0.5096240122157427 + }, + { + "name": "model.layers.40.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1970626474067103e-05, + "sensitivity": 1.3076308095874911 + }, + { + "name": "model.layers.40.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.289802053695894e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007564167026430368, + "sensitivity": 0.5654844866626042 + }, + { + "name": "model.layers.40.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.871427129022777e-05, + "sensitivity": 0.8801380603145604 + }, + { + "name": "model.layers.40.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.724059744556143e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006581732886843383, + "sensitivity": 0.5542626829707376 + }, + { + "name": "model.layers.40.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006891795201227069, + "sensitivity": 0.5460115770292574 + }, + { + "name": "model.layers.40.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.923263408178173e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006830228376202285, + "sensitivity": 0.5610455670300544 + }, + { + "name": "model.layers.40.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.138946628198028e-05, + "sensitivity": 0.8273367704431015 + }, + { + "name": "model.layers.40.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.86518910445011e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006641907384619117, + "sensitivity": 0.5247007686874113 + }, + { + "name": "model.layers.40.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.592979480046779e-05, + "sensitivity": 0.624622927790186 + }, + { + "name": "model.layers.40.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1319635859763366e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.37564662611112e-05, + "sensitivity": 0.6405328797655624 + }, + { + "name": "model.layers.40.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.167396350065246e-05, + "sensitivity": 0.9460566592544228 + }, + { + "name": "model.layers.40.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2082720104444888e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007024985970929265, + "sensitivity": 0.5835881133858595 + }, + { + "name": "model.layers.40.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1857850040541962e-05, + "sensitivity": 1.361629432937203 + }, + { + "name": "model.layers.40.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4418841374208569e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.028022471582517e-05, + "sensitivity": 0.785790759146431 + }, + { + "name": "model.layers.40.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0854228094103746e-05, + "sensitivity": 1.5195395785628663 + }, + { + "name": "model.layers.40.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.952653848202317e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.991497164359316e-05, + "sensitivity": 0.7290266965503246 + }, + { + "name": "model.layers.40.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9892576246056706e-05, + "sensitivity": 1.02604805685159 + }, + { + "name": "model.layers.40.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1201180996067706e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006396970129571855, + "sensitivity": 0.5653383470234207 + }, + { + "name": "model.layers.40.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1049184649891686e-05, + "sensitivity": 1.5032121094235942 + }, + { + "name": "model.layers.40.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0839253263839055e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.860087912878953e-05, + "sensitivity": 0.7716582170119777 + }, + { + "name": "model.layers.40.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0773538280045614e-05, + "sensitivity": 0.6146371628167426 + }, + { + "name": "model.layers.40.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.59762473939918e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.958662222838029e-05, + "sensitivity": 0.6343307621519229 + }, + { + "name": "model.layers.40.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.885143036721274e-05, + "sensitivity": 1.1576873430163013 + }, + { + "name": "model.layers.40.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.590540687691828e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.839686491526663e-05, + "sensitivity": 0.6288812532872442 + }, + { + "name": "model.layers.40.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8698904467746615e-05, + "sensitivity": 1.0926980244585291 + }, + { + "name": "model.layers.40.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.802882914300426e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.958421388641e-05, + "sensitivity": 0.716836638056771 + }, + { + "name": "model.layers.40.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.436802505049855e-05, + "sensitivity": 0.8627727070667928 + }, + { + "name": "model.layers.40.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.178882697189692e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007029238040558994, + "sensitivity": 0.5303473133785008 + }, + { + "name": "model.layers.40.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.03547484590672e-05, + "sensitivity": 0.7808772041245244 + }, + { + "name": "model.layers.40.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0011483482230688e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.277500844793394e-05, + "sensitivity": 0.6092796425528677 + }, + { + "name": "model.layers.40.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1635862392722629e-05, + "sensitivity": 1.8765914296092248 + }, + { + "name": "model.layers.40.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2285989896554383e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.045298505341634e-05, + "sensitivity": 0.6800174379388412 + }, + { + "name": "model.layers.40.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.534165004268289e-05, + "sensitivity": 0.6138151745338231 + }, + { + "name": "model.layers.40.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.595785286364844e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.375550583470613e-05, + "sensitivity": 0.6090123459742544 + }, + { + "name": "model.layers.40.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.405618478311226e-05, + "sensitivity": 0.7771500723526146 + }, + { + "name": "model.layers.40.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.998283197390265e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.370826304191723e-05, + "sensitivity": 0.6611920125826133 + }, + { + "name": "model.layers.40.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.470950756920502e-05, + "sensitivity": 0.7402160600942838 + }, + { + "name": "model.layers.40.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.65752269874065e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007121765520423651, + "sensitivity": 0.5262406588178846 + }, + { + "name": "model.layers.40.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9131427406100556e-05, + "sensitivity": 1.0450480074874315 + }, + { + "name": "model.layers.40.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.615211987082148e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006784303113818169, + "sensitivity": 0.5076655225368633 + }, + { + "name": "model.layers.40.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.00066953751957044, + "sensitivity": 0.5981714674928128 + }, + { + "name": "model.layers.40.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.321957014028158e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006598655018024147, + "sensitivity": 0.5150015882052565 + }, + { + "name": "model.layers.40.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.331222539301962e-05, + "sensitivity": 0.6799515348207157 + }, + { + "name": "model.layers.40.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.074733616718731e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007255206583067775, + "sensitivity": 0.5396972447882777 + }, + { + "name": "model.layers.40.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0649231626302935e-05, + "sensitivity": 1.2013060501174786 + }, + { + "name": "model.layers.40.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0657497568899998e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000662231061141938, + "sensitivity": 0.5835230230452935 + }, + { + "name": "model.layers.40.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.335112993838266e-05, + "sensitivity": 0.7985328444484188 + }, + { + "name": "model.layers.40.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.684752745262813e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007147648138925433, + "sensitivity": 0.5268945773934967 + }, + { + "name": "model.layers.40.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.117508019087836e-05, + "sensitivity": 0.9764783717783857 + }, + { + "name": "model.layers.40.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.299889486806933e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006732306210324168, + "sensitivity": 0.5491633004986703 + }, + { + "name": "model.layers.40.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.084538598661311e-05, + "sensitivity": 1.5505420896948876 + }, + { + "name": "model.layers.40.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.115187029034132e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.919762043049559e-05, + "sensitivity": 0.6542507819183647 + }, + { + "name": "model.layers.40.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.77844402869232e-05, + "sensitivity": 0.9222549567135176 + }, + { + "name": "model.layers.40.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.162093440143508e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.095062053645961e-05, + "sensitivity": 0.7993033849261499 + }, + { + "name": "model.layers.40.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.110632911149878e-05, + "sensitivity": 1.233408743851293 + }, + { + "name": "model.layers.40.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.173001333489083e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006887412164360285, + "sensitivity": 0.5169324847930068 + }, + { + "name": "model.layers.40.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.023387686582282e-05, + "sensitivity": 0.973138588350081 + }, + { + "name": "model.layers.40.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.168816197605338e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9194349887548015e-05, + "sensitivity": 0.9698673456943088 + }, + { + "name": "model.layers.40.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8304907724959776e-05, + "sensitivity": 1.088232713463895 + }, + { + "name": "model.layers.40.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.875192065715964e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006586451781913638, + "sensitivity": 0.547035609609048 + }, + { + "name": "model.layers.40.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0197472875006497e-05, + "sensitivity": 1.9635503452387377 + }, + { + "name": "model.layers.40.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.05533104033384e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9086185501655564e-05, + "sensitivity": 0.6715638016350524 + }, + { + "name": "model.layers.40.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.345484871417284e-05, + "sensitivity": 0.6238913693223482 + }, + { + "name": "model.layers.40.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.398666639346629e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007017114548943937, + "sensitivity": 0.5686855698649967 + }, + { + "name": "model.layers.40.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0738589480752125e-05, + "sensitivity": 1.3437427530026567 + }, + { + "name": "model.layers.40.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0372672250014148e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006565612275153399, + "sensitivity": 0.5674978475784388 + }, + { + "name": "model.layers.40.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.086170469643548e-05, + "sensitivity": 1.1473019232934123 + }, + { + "name": "model.layers.40.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.977750442478282e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006583728827536106, + "sensitivity": 0.5298015409645644 + }, + { + "name": "model.layers.40.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.897074152017012e-05, + "sensitivity": 0.7448653256615452 + }, + { + "name": "model.layers.40.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.063354132696986e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7169992942363024e-05, + "sensitivity": 0.6167614521796387 + }, + { + "name": "model.layers.40.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.215028406586498e-05, + "sensitivity": 0.8830384067041195 + }, + { + "name": "model.layers.40.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.519475164168398e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.816719542257488e-05, + "sensitivity": 0.6918792648676715 + }, + { + "name": "model.layers.40.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1313239156152122e-05, + "sensitivity": 1.3245784942565664 + }, + { + "name": "model.layers.40.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1107989621450542e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.305113492999226e-05, + "sensitivity": 0.8795836342420255 + }, + { + "name": "model.layers.40.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.98431724938564e-05, + "sensitivity": 1.097602858849579 + }, + { + "name": "model.layers.40.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.095529213074769e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006672395393252373, + "sensitivity": 0.5781743503029454 + }, + { + "name": "model.layers.40.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.9321329899830744e-05, + "sensitivity": 0.6032475544815349 + }, + { + "name": "model.layers.40.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.072244893104653e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006813372019678354, + "sensitivity": 0.5663149181457351 + }, + { + "name": "model.layers.40.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1659830306598451e-05, + "sensitivity": 1.4777859722793336 + }, + { + "name": "model.layers.40.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.161877869701129e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000699371739756316, + "sensitivity": 0.5844374951503545 + }, + { + "name": "model.layers.40.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0464619663252961e-05, + "sensitivity": 1.3999779194782118 + }, + { + "name": "model.layers.40.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0131960834769416e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9983791288686916e-05, + "sensitivity": 0.6358177653654509 + }, + { + "name": "model.layers.40.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.857922562630847e-05, + "sensitivity": 0.7578005549678414 + }, + { + "name": "model.layers.40.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.861498261263478e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007855623844079673, + "sensitivity": 0.5465149342490281 + }, + { + "name": "model.layers.40.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.212333391886204e-05, + "sensitivity": 1.0647942976089952 + }, + { + "name": "model.layers.40.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.017292205091508e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000696613802574575, + "sensitivity": 0.5248351170523925 + }, + { + "name": "model.layers.40.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.204645615071058e-05, + "sensitivity": 0.6693591780450092 + }, + { + "name": "model.layers.40.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1130546226922888e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007024848600849509, + "sensitivity": 0.5147688075540559 + }, + { + "name": "model.layers.40.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.006411730486434e-05, + "sensitivity": 1.840243065744812 + }, + { + "name": "model.layers.40.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.875451046857052e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.087362999096513e-05, + "sensitivity": 0.8620469024495363 + }, + { + "name": "model.layers.40.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.252165621845052e-05, + "sensitivity": 1.1594864129160005 + }, + { + "name": "model.layers.40.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.97114751094341e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007060301722958684, + "sensitivity": 0.5435561935695498 + }, + { + "name": "model.layers.40.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.21348769729957e-05, + "sensitivity": 0.9036305857699105 + }, + { + "name": "model.layers.40.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0285029929946177e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.771463424433023e-05, + "sensitivity": 0.7056960748806214 + }, + { + "name": "model.layers.40.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.01276260567829e-05, + "sensitivity": 0.6703623224317394 + }, + { + "name": "model.layers.40.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.986882681303541e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006775002693757415, + "sensitivity": 0.5062494810511531 + }, + { + "name": "model.layers.40.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0480437241494656e-05, + "sensitivity": 0.6302591640580998 + }, + { + "name": "model.layers.40.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.253957387045375e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006547748926095665, + "sensitivity": 0.5370552251395093 + }, + { + "name": "model.layers.40.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.777754631708376e-05, + "sensitivity": 0.9732512828712033 + }, + { + "name": "model.layers.40.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0575718079053331e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006484420737251639, + "sensitivity": 0.5519115989116903 + }, + { + "name": "model.layers.40.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.24459789833054e-05, + "sensitivity": 0.7790472219652775 + }, + { + "name": "model.layers.40.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.06054039861192e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007153379265218973, + "sensitivity": 0.5517694204483428 + }, + { + "name": "model.layers.40.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.7376695495840977e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.270014647365315e-06, + "sensitivity": 2.1044663463852795 + }, + { + "name": "model.layers.40.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 3.8911248338990845e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.40.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.6376847042920417e-06, + "sensitivity": 2.1060851780085037 + }, + { + "name": "model.layers.40.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 7.248479505506111e-06, + "sensitivity": 2.0740932415548965 + }, + { + "name": "model.layers.40.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00017637867131270468, + "sensitivity": 0.8819618728863331 + }, + { + "name": "model.layers.40.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.3413685337582137e-05, + "sensitivity": 1.9227917845277316 + }, + { + "name": "model.layers.40.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 4.89735793962609e-05, + "sensitivity": 0.6321370544899039 + }, + { + "name": "model.layers.40.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.0002854735357686877, + "sensitivity": 0.9108304140560908 + }, + { + "name": "model.layers.41.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0014215705450624e-05, + "sensitivity": 0.9473154958745369 + }, + { + "name": "model.layers.41.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.368750516434375e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006826412281952798, + "sensitivity": 0.5615932660774531 + }, + { + "name": "model.layers.41.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.985827349126339e-05, + "sensitivity": 0.8677240144072765 + }, + { + "name": "model.layers.41.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.745276656758506e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007958390633575618, + "sensitivity": 0.5958421844649806 + }, + { + "name": "model.layers.41.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.39455538475886e-05, + "sensitivity": 1.030727138647284 + }, + { + "name": "model.layers.41.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.095807970676105e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006919209263287485, + "sensitivity": 0.5394397701037097 + }, + { + "name": "model.layers.41.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006539843743667006, + "sensitivity": 0.5930950856305828 + }, + { + "name": "model.layers.41.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.378641046467237e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006743529811501503, + "sensitivity": 0.5070556522250319 + }, + { + "name": "model.layers.41.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1018101758963894e-05, + "sensitivity": 1.690785281404908 + }, + { + "name": "model.layers.41.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2646893310375162e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.869124652235769e-05, + "sensitivity": 0.6457012682702927 + }, + { + "name": "model.layers.41.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1487334631965496e-05, + "sensitivity": 1.4520926125768334 + }, + { + "name": "model.layers.41.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.35863295631134e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006834515370428562, + "sensitivity": 0.5858834536051551 + }, + { + "name": "model.layers.41.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.694642459275201e-05, + "sensitivity": 0.6613775481780347 + }, + { + "name": "model.layers.41.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.395365173579194e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006464883335866034, + "sensitivity": 0.5899191407678787 + }, + { + "name": "model.layers.41.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.081832543713972e-05, + "sensitivity": 0.6495739971000933 + }, + { + "name": "model.layers.41.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.676117436654749e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006908971117809415, + "sensitivity": 0.5268919054133152 + }, + { + "name": "model.layers.41.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007100695511326194, + "sensitivity": 0.5455223061547589 + }, + { + "name": "model.layers.41.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.603985293120786e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006813002983108163, + "sensitivity": 0.5218952503385224 + }, + { + "name": "model.layers.41.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.736460298066959e-05, + "sensitivity": 0.9049304283695938 + }, + { + "name": "model.layers.41.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.068417400863837e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000680064782500267, + "sensitivity": 0.5767533207514354 + }, + { + "name": "model.layers.41.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.51246082270518e-05, + "sensitivity": 1.178558103472682 + }, + { + "name": "model.layers.41.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1255007166255382e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.405120802810416e-05, + "sensitivity": 0.6288815176326439 + }, + { + "name": "model.layers.41.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007343272445723414, + "sensitivity": 0.547303608179574 + }, + { + "name": "model.layers.41.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.548871275910642e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.37494886177592e-05, + "sensitivity": 0.6119310724390556 + }, + { + "name": "model.layers.41.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.4149921955540776e-06, + "sensitivity": 2.097647856946052 + }, + { + "name": "model.layers.41.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.023821596390917e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9262813010718673e-05, + "sensitivity": 0.6283041249671761 + }, + { + "name": "model.layers.41.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0685648350045085e-05, + "sensitivity": 0.8280685856734893 + }, + { + "name": "model.layers.41.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0769065283966484e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.145599036244676e-05, + "sensitivity": 0.6893037925244163 + }, + { + "name": "model.layers.41.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007029154803603888, + "sensitivity": 0.5749125189940472 + }, + { + "name": "model.layers.41.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.338878387803561e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007004638900980353, + "sensitivity": 0.5196780525900908 + }, + { + "name": "model.layers.41.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.291441241046414e-05, + "sensitivity": 1.0309595490461942 + }, + { + "name": "model.layers.41.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.072036277757434e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007307810592465103, + "sensitivity": 0.5529302208551214 + }, + { + "name": "model.layers.41.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.268854485824704e-05, + "sensitivity": 0.743441305975727 + }, + { + "name": "model.layers.41.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.832466053514509e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006851596990600228, + "sensitivity": 0.5281637750457605 + }, + { + "name": "model.layers.41.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.662749026669189e-05, + "sensitivity": 1.0461958465232477 + }, + { + "name": "model.layers.41.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0508447303436697e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.4691619880031794e-05, + "sensitivity": 0.6473071977545304 + }, + { + "name": "model.layers.41.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.096180732129142e-05, + "sensitivity": 0.8275436160625628 + }, + { + "name": "model.layers.41.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.201231480597926e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007133566541597247, + "sensitivity": 0.5396382758944988 + }, + { + "name": "model.layers.41.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.272321242140606e-05, + "sensitivity": 1.2612463000026595 + }, + { + "name": "model.layers.41.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1521103715494974e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007958944770507514, + "sensitivity": 0.5412189673125579 + }, + { + "name": "model.layers.41.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.376129749696702e-05, + "sensitivity": 0.7163280057743239 + }, + { + "name": "model.layers.41.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.043933459906839e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006823735311627388, + "sensitivity": 0.5477793794954507 + }, + { + "name": "model.layers.41.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000649435562081635, + "sensitivity": 0.5813044986708081 + }, + { + "name": "model.layers.41.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.289839001918153e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006251713493838906, + "sensitivity": 0.5375317399326406 + }, + { + "name": "model.layers.41.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6516757467761636e-05, + "sensitivity": 0.9144496501318945 + }, + { + "name": "model.layers.41.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0250623745378107e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.753510049544275e-05, + "sensitivity": 0.628657909782834 + }, + { + "name": "model.layers.41.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.797897756565362e-05, + "sensitivity": 0.6080857899825619 + }, + { + "name": "model.layers.41.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.753821253369097e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006689359433948994, + "sensitivity": 0.5111914174731089 + }, + { + "name": "model.layers.41.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0735151590779424e-05, + "sensitivity": 1.3112428123900948 + }, + { + "name": "model.layers.41.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0663924285836401e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.217809277586639e-05, + "sensitivity": 0.7217420748556598 + }, + { + "name": "model.layers.41.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.099191523389891e-05, + "sensitivity": 0.9251190141845483 + }, + { + "name": "model.layers.41.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.439097089445568e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007009552791714668, + "sensitivity": 0.5296733226687214 + }, + { + "name": "model.layers.41.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.039080835762434e-05, + "sensitivity": 0.6026787071697873 + }, + { + "name": "model.layers.41.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.023547254902951e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006704982370138168, + "sensitivity": 0.5331517339497778 + }, + { + "name": "model.layers.41.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.894645048305392e-05, + "sensitivity": 0.9725525349363736 + }, + { + "name": "model.layers.41.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.755474366102135e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.599515083711594e-05, + "sensitivity": 0.6496344058506931 + }, + { + "name": "model.layers.41.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1318118595227133e-05, + "sensitivity": 1.3450392601713232 + }, + { + "name": "model.layers.41.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.53812855691649e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.673176540061831e-05, + "sensitivity": 0.7805528750821713 + }, + { + "name": "model.layers.41.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.321809632936493e-05, + "sensitivity": 0.9131967794635586 + }, + { + "name": "model.layers.41.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.147396215463232e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006743567064404488, + "sensitivity": 0.5178554647872098 + }, + { + "name": "model.layers.41.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.450628279708326e-05, + "sensitivity": 0.8405802045532068 + }, + { + "name": "model.layers.41.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0784269761643372e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.156053859740496e-05, + "sensitivity": 0.7676735747236455 + }, + { + "name": "model.layers.41.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.704393308609724e-05, + "sensitivity": 0.8794433583510991 + }, + { + "name": "model.layers.41.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.016059059111285e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.72550086164847e-05, + "sensitivity": 0.6118723014308544 + }, + { + "name": "model.layers.41.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0055794165236875e-05, + "sensitivity": 0.6033871816801845 + }, + { + "name": "model.layers.41.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.964540600369219e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006741037359461188, + "sensitivity": 0.5239293087266806 + }, + { + "name": "model.layers.41.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.859525845153257e-05, + "sensitivity": 0.6390266831767064 + }, + { + "name": "model.layers.41.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.755515412100067e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000645384774543345, + "sensitivity": 0.5556026804527863 + }, + { + "name": "model.layers.41.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.898211384192109e-05, + "sensitivity": 1.118577280586735 + }, + { + "name": "model.layers.41.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1337796195221017e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006751897162757814, + "sensitivity": 0.5446997867065309 + }, + { + "name": "model.layers.41.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.5309807369922055e-06, + "sensitivity": 2.0971843871821463 + }, + { + "name": "model.layers.41.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5883800870142295e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0109596233814955e-05, + "sensitivity": 0.7958065249428495 + }, + { + "name": "model.layers.41.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006735351635143161, + "sensitivity": 0.5540043465878912 + }, + { + "name": "model.layers.41.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.609145088987134e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006709710578434169, + "sensitivity": 0.5456628462388693 + }, + { + "name": "model.layers.41.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.1278413340915e-05, + "sensitivity": 0.7786273927542846 + }, + { + "name": "model.layers.41.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.903718367037072e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006911371601745486, + "sensitivity": 0.580349963398253 + }, + { + "name": "model.layers.41.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.2554593215318164e-06, + "sensitivity": 2.0660453725384755 + }, + { + "name": "model.layers.41.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.142121504926763e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006270328303799033, + "sensitivity": 0.5964012976267243 + }, + { + "name": "model.layers.41.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.412077345885336e-05, + "sensitivity": 0.7659197357327157 + }, + { + "name": "model.layers.41.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.99056146863586e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.307669536909088e-05, + "sensitivity": 0.635609956075893 + }, + { + "name": "model.layers.41.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007079103961586952, + "sensitivity": 0.580946567914994 + }, + { + "name": "model.layers.41.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.63215837196185e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007227996829897165, + "sensitivity": 0.5682448005563207 + }, + { + "name": "model.layers.41.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.135553121566772e-05, + "sensitivity": 0.6469623592317784 + }, + { + "name": "model.layers.41.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.962138172639243e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007010043482296169, + "sensitivity": 0.5273443730831106 + }, + { + "name": "model.layers.41.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.261763337533921e-05, + "sensitivity": 0.7503401429020842 + }, + { + "name": "model.layers.41.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.994830528128659e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007137047359719872, + "sensitivity": 0.5336408190456772 + }, + { + "name": "model.layers.41.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7454322814010084e-05, + "sensitivity": 0.6723554856876358 + }, + { + "name": "model.layers.41.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.52287212687952e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000642994767986238, + "sensitivity": 0.5107356692791247 + }, + { + "name": "model.layers.41.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6050772400340065e-05, + "sensitivity": 0.8837375497344869 + }, + { + "name": "model.layers.41.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.552788924338529e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006891568191349506, + "sensitivity": 0.5985433022683476 + }, + { + "name": "model.layers.41.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1305367479508277e-05, + "sensitivity": 1.2538808216875104 + }, + { + "name": "model.layers.41.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1955032732657855e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006709459121339023, + "sensitivity": 0.576176287293854 + }, + { + "name": "model.layers.41.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.217109638673719e-05, + "sensitivity": 1.2768486252227693 + }, + { + "name": "model.layers.41.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.26046607724129e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007208720780909061, + "sensitivity": 0.5077073710766574 + }, + { + "name": "model.layers.41.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006913035176694393, + "sensitivity": 0.5140819427416049 + }, + { + "name": "model.layers.41.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.046321227084263e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006614301237277687, + "sensitivity": 0.538192485331879 + }, + { + "name": "model.layers.41.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.72855312586762e-05, + "sensitivity": 0.7240514665270148 + }, + { + "name": "model.layers.41.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.198171255775378e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007643825374543667, + "sensitivity": 0.5463410404973734 + }, + { + "name": "model.layers.41.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8245128457201645e-05, + "sensitivity": 0.6328891291984046 + }, + { + "name": "model.layers.41.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.560971428370976e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006481005111709237, + "sensitivity": 0.5617556652009931 + }, + { + "name": "model.layers.41.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.039664731360972e-05, + "sensitivity": 0.7829448572995998 + }, + { + "name": "model.layers.41.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.102524932633969e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006459177238866687, + "sensitivity": 0.5251627198030586 + }, + { + "name": "model.layers.41.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007044441881589592, + "sensitivity": 0.5917143537571611 + }, + { + "name": "model.layers.41.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.23705704533495e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000664009596221149, + "sensitivity": 0.5249463023283387 + }, + { + "name": "model.layers.41.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006909488001838326, + "sensitivity": 0.5589949901260985 + }, + { + "name": "model.layers.41.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.304964810828096e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006838515400886536, + "sensitivity": 0.5198717568074016 + }, + { + "name": "model.layers.41.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.7221430324716493e-05, + "sensitivity": 0.664424028633191 + }, + { + "name": "model.layers.41.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.780475700907118e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006915663834661245, + "sensitivity": 0.5656743861791561 + }, + { + "name": "model.layers.41.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.591388228116557e-05, + "sensitivity": 0.6928039057835625 + }, + { + "name": "model.layers.41.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.569071496822289e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007154032355174422, + "sensitivity": 0.5810094878772014 + }, + { + "name": "model.layers.41.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.478707655332983e-05, + "sensitivity": 0.6569476283161445 + }, + { + "name": "model.layers.41.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.350872692768462e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007135821506381035, + "sensitivity": 0.5381796655413766 + }, + { + "name": "model.layers.41.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.954498192295432e-05, + "sensitivity": 0.6172877902238089 + }, + { + "name": "model.layers.41.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.66999505685817e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006395004456862807, + "sensitivity": 0.539054976939576 + }, + { + "name": "model.layers.41.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.361599662341177e-05, + "sensitivity": 1.0755950337738462 + }, + { + "name": "model.layers.41.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.7849487221610616e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.060549276298843e-05, + "sensitivity": 0.6828571506531207 + }, + { + "name": "model.layers.41.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0684698837576434e-05, + "sensitivity": 0.7683430818284114 + }, + { + "name": "model.layers.41.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.663024916837458e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.22274455963634e-05, + "sensitivity": 0.6007335473080094 + }, + { + "name": "model.layers.41.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.13320547825424e-05, + "sensitivity": 1.959106246380401 + }, + { + "name": "model.layers.41.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5235598311846843e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.874672206118703e-05, + "sensitivity": 0.7587259537372282 + }, + { + "name": "model.layers.41.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.6269516790052876e-05, + "sensitivity": 0.7978794170571842 + }, + { + "name": "model.layers.41.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0523762057346175e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00063088140450418, + "sensitivity": 0.5687902267250491 + }, + { + "name": "model.layers.41.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.26073160674423e-05, + "sensitivity": 0.9419534160888454 + }, + { + "name": "model.layers.41.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.457751394213119e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007397853769361973, + "sensitivity": 0.5399738374944919 + }, + { + "name": "model.layers.41.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.518992449855432e-05, + "sensitivity": 0.7480016361348932 + }, + { + "name": "model.layers.41.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.433432299170818e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.44297688268125e-05, + "sensitivity": 0.6198039728546172 + }, + { + "name": "model.layers.41.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.26630790065974e-05, + "sensitivity": 0.9781163455208365 + }, + { + "name": "model.layers.41.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.155002089755726e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006989313988015056, + "sensitivity": 0.5702501135014564 + }, + { + "name": "model.layers.41.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.6158246580744162e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.823588602041127e-06, + "sensitivity": 2.1046306987645313 + }, + { + "name": "model.layers.41.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.070756858709501e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.41.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.6009091723390156e-06, + "sensitivity": 2.105183120959502 + }, + { + "name": "model.layers.41.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 1.136887749453308e-05, + "sensitivity": 2.2299636904771125 + }, + { + "name": "model.layers.41.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00016693651559762657, + "sensitivity": 0.7437160278456537 + }, + { + "name": "model.layers.41.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.937441629706882e-05, + "sensitivity": 0.8174296001364302 + }, + { + "name": "model.layers.41.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 4.936152254231274e-05, + "sensitivity": 0.8506519673861413 + }, + { + "name": "model.layers.41.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00021875753009226173, + "sensitivity": 0.7663255807388758 + }, + { + "name": "model.layers.42.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.841529855388217e-05, + "sensitivity": 0.7957119149922822 + }, + { + "name": "model.layers.42.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.555017186357873e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.7836685300571844e-05, + "sensitivity": 0.7802066550944822 + }, + { + "name": "model.layers.42.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0857602319447324e-05, + "sensitivity": 1.3231470746963065 + }, + { + "name": "model.layers.42.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1364725196472136e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006856260588392615, + "sensitivity": 0.5900897995729383 + }, + { + "name": "model.layers.42.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.515988206956536e-05, + "sensitivity": 0.7260876352241864 + }, + { + "name": "model.layers.42.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.886656021582894e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007187202572822571, + "sensitivity": 0.5528980650929015 + }, + { + "name": "model.layers.42.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007666065357625484, + "sensitivity": 0.528838097454211 + }, + { + "name": "model.layers.42.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.216026460810099e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007471974822692573, + "sensitivity": 0.5441465076639755 + }, + { + "name": "model.layers.42.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007185963913798332, + "sensitivity": 0.5881133615464419 + }, + { + "name": "model.layers.42.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.703962066647364e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006633991142734885, + "sensitivity": 0.5642161365858734 + }, + { + "name": "model.layers.42.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.29062342341058e-05, + "sensitivity": 0.8787289554209534 + }, + { + "name": "model.layers.42.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.932016382663278e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006909994408488274, + "sensitivity": 0.5659151947853597 + }, + { + "name": "model.layers.42.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.227577978279442e-05, + "sensitivity": 0.7354239753439784 + }, + { + "name": "model.layers.42.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.309768529419671e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006665278924629092, + "sensitivity": 0.5279137781564828 + }, + { + "name": "model.layers.42.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000695937080308795, + "sensitivity": 0.5855078362591475 + }, + { + "name": "model.layers.42.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.517912194998644e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006879447028040886, + "sensitivity": 0.5472404529116469 + }, + { + "name": "model.layers.42.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.414746167138219e-05, + "sensitivity": 0.7043633264119538 + }, + { + "name": "model.layers.42.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.343247029391932e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000697073875926435, + "sensitivity": 0.5283186240394318 + }, + { + "name": "model.layers.42.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.477203714894131e-05, + "sensitivity": 1.018397678928106 + }, + { + "name": "model.layers.42.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 3.3711173728079302e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.004391980241053e-05, + "sensitivity": 0.6946895831136989 + }, + { + "name": "model.layers.42.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.662727926392108e-05, + "sensitivity": 0.8394184996414573 + }, + { + "name": "model.layers.42.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.251550530578243e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.905995931243524e-05, + "sensitivity": 0.9166191446612414 + }, + { + "name": "model.layers.42.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.421824946301058e-05, + "sensitivity": 0.7456914367254829 + }, + { + "name": "model.layers.42.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.834805953483738e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0432001191657037e-05, + "sensitivity": 0.6555380290921038 + }, + { + "name": "model.layers.42.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.257584027480334e-05, + "sensitivity": 0.6107202071242017 + }, + { + "name": "model.layers.42.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.339013106706261e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006481194868683815, + "sensitivity": 0.5281825312463373 + }, + { + "name": "model.layers.42.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.959944585105404e-05, + "sensitivity": 0.6704017326974941 + }, + { + "name": "model.layers.42.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.895680482761236e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.001499034231529e-05, + "sensitivity": 0.6582125270723204 + }, + { + "name": "model.layers.42.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.36108306935057e-05, + "sensitivity": 0.9112478715317222 + }, + { + "name": "model.layers.42.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.492514436715282e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007152113830670714, + "sensitivity": 0.548880267424116 + }, + { + "name": "model.layers.42.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.6466185671743e-05, + "sensitivity": 0.9620782011697538 + }, + { + "name": "model.layers.42.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2219447853567544e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007017725147306919, + "sensitivity": 0.5701031565689625 + }, + { + "name": "model.layers.42.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0786619895952754e-05, + "sensitivity": 1.6370386748362917 + }, + { + "name": "model.layers.42.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.470371426483325e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.329223106149584e-05, + "sensitivity": 0.8766514063870581 + }, + { + "name": "model.layers.42.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.0390433999418747e-05, + "sensitivity": 1.8971330840274092 + }, + { + "name": "model.layers.42.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.385707251865824e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000717572052963078, + "sensitivity": 0.524005473573515 + }, + { + "name": "model.layers.42.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000722483906429261, + "sensitivity": 0.5358038064562543 + }, + { + "name": "model.layers.42.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.17668592389964e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007184402784332633, + "sensitivity": 0.5431193168381769 + }, + { + "name": "model.layers.42.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.912224150961265e-05, + "sensitivity": 0.8943963056026272 + }, + { + "name": "model.layers.42.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1317815733491443e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.064596527721733e-05, + "sensitivity": 0.7890594121277295 + }, + { + "name": "model.layers.42.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.321022374322638e-05, + "sensitivity": 0.791861954959914 + }, + { + "name": "model.layers.42.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.61006469676795e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006844158633612096, + "sensitivity": 0.5198531686652696 + }, + { + "name": "model.layers.42.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.351924093905836e-05, + "sensitivity": 0.7490292203066264 + }, + { + "name": "model.layers.42.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.64012180903228e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.877725197933614e-05, + "sensitivity": 0.6816939039419588 + }, + { + "name": "model.layers.42.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006681570084765553, + "sensitivity": 0.5636357173950649 + }, + { + "name": "model.layers.42.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.415692605012737e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006219518836587667, + "sensitivity": 0.5466696186482577 + }, + { + "name": "model.layers.42.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.152949936222285e-05, + "sensitivity": 0.8327871896078628 + }, + { + "name": "model.layers.42.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.41454379951756e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006963221239857376, + "sensitivity": 0.5191804995441407 + }, + { + "name": "model.layers.42.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007689629564993083, + "sensitivity": 0.5384276379838014 + }, + { + "name": "model.layers.42.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.824048111615411e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.017911411821842e-05, + "sensitivity": 0.6959803595228109 + }, + { + "name": "model.layers.42.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006938354927115142, + "sensitivity": 0.5403219622669397 + }, + { + "name": "model.layers.42.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.55552150621952e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.961046554148197e-05, + "sensitivity": 0.6019468899995257 + }, + { + "name": "model.layers.42.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.305998977040872e-05, + "sensitivity": 0.7273146669004641 + }, + { + "name": "model.layers.42.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.22104788969591e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.33803938399069e-05, + "sensitivity": 0.7113421617490936 + }, + { + "name": "model.layers.42.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007721766596660018, + "sensitivity": 0.5969072642026748 + }, + { + "name": "model.layers.42.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.15213411442528e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00076205690857023, + "sensitivity": 0.5359761694038155 + }, + { + "name": "model.layers.42.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.164881051518023e-05, + "sensitivity": 0.6638906004262348 + }, + { + "name": "model.layers.42.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.972930688993074e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006960458122193813, + "sensitivity": 0.5242914073032128 + }, + { + "name": "model.layers.42.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006955303251743317, + "sensitivity": 0.5436855737811525 + }, + { + "name": "model.layers.42.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.134125326047069e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006508738733828068, + "sensitivity": 0.5575961127733322 + }, + { + "name": "model.layers.42.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007137075299397111, + "sensitivity": 0.547972069363834 + }, + { + "name": "model.layers.42.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.795737815285975e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000734523287974298, + "sensitivity": 0.5627470176692915 + }, + { + "name": "model.layers.42.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.823950777994469e-05, + "sensitivity": 0.8258675677818186 + }, + { + "name": "model.layers.42.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.826755563655752e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006011682562530041, + "sensitivity": 0.5549504582609434 + }, + { + "name": "model.layers.42.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.605713133467361e-05, + "sensitivity": 0.7247001641381936 + }, + { + "name": "model.layers.42.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.078006317191466e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007018343894742429, + "sensitivity": 0.5425029258117264 + }, + { + "name": "model.layers.42.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.037659113644622e-05, + "sensitivity": 0.6013140849024605 + }, + { + "name": "model.layers.42.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.684772521723062e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006402776343747973, + "sensitivity": 0.5639058525594804 + }, + { + "name": "model.layers.42.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.265392585191876e-05, + "sensitivity": 0.69808798491704 + }, + { + "name": "model.layers.42.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.525641419510066e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006855819374322891, + "sensitivity": 0.5636779892336032 + }, + { + "name": "model.layers.42.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.000485154800117e-05, + "sensitivity": 0.8315855166128107 + }, + { + "name": "model.layers.42.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.46968079409271e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.875012720935047e-05, + "sensitivity": 0.7898663136928536 + }, + { + "name": "model.layers.42.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.211718573467806e-05, + "sensitivity": 0.9524992934922878 + }, + { + "name": "model.layers.42.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.573803501742077e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.97207433404401e-05, + "sensitivity": 0.7449550418513916 + }, + { + "name": "model.layers.42.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007294550305232406, + "sensitivity": 0.5863101894099255 + }, + { + "name": "model.layers.42.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.512640192748222e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.1832709787995555e-05, + "sensitivity": 1.2076650356964242 + }, + { + "name": "model.layers.42.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.461658631451428e-05, + "sensitivity": 0.8718683314746938 + }, + { + "name": "model.layers.42.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.115264694817597e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.653965101577342e-05, + "sensitivity": 0.7542416297560929 + }, + { + "name": "model.layers.42.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006800342234782875, + "sensitivity": 0.5562639367676248 + }, + { + "name": "model.layers.42.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.51461777529039e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006344640860334039, + "sensitivity": 0.5823763621259959 + }, + { + "name": "model.layers.42.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.914940604474396e-05, + "sensitivity": 0.6028626362736123 + }, + { + "name": "model.layers.42.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.888129402999766e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00078191002830863, + "sensitivity": 0.5469874649809215 + }, + { + "name": "model.layers.42.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.935208173468709e-05, + "sensitivity": 0.9576644442246535 + }, + { + "name": "model.layers.42.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.246539214771474e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.67234746995382e-05, + "sensitivity": 0.8384764383667201 + }, + { + "name": "model.layers.42.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.27351037110202e-05, + "sensitivity": 0.7415633994582423 + }, + { + "name": "model.layers.42.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.747560625328333e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006950628012418747, + "sensitivity": 0.5781572522599896 + }, + { + "name": "model.layers.42.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.437484989874065e-05, + "sensitivity": 1.0622152745182751 + }, + { + "name": "model.layers.42.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.007466132970876e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000747651734855026, + "sensitivity": 0.5723989061936089 + }, + { + "name": "model.layers.42.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0876183852087706e-05, + "sensitivity": 1.0757531109824379 + }, + { + "name": "model.layers.42.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.392846456838015e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006803018040955067, + "sensitivity": 0.5555293420253357 + }, + { + "name": "model.layers.42.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.892054468858987e-05, + "sensitivity": 0.6553367277566738 + }, + { + "name": "model.layers.42.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.074842756082944e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006392718642018735, + "sensitivity": 0.555718772971481 + }, + { + "name": "model.layers.42.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007037587347440422, + "sensitivity": 0.5508363463536361 + }, + { + "name": "model.layers.42.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.800029268561048e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.00070993322879076, + "sensitivity": 0.5593918525934858 + }, + { + "name": "model.layers.42.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.81035201321356e-05, + "sensitivity": 0.7469523656929645 + }, + { + "name": "model.layers.42.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.845213758628233e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.007660340401344e-05, + "sensitivity": 0.6041161713793266 + }, + { + "name": "model.layers.42.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.583704089280218e-05, + "sensitivity": 0.618624454217352 + }, + { + "name": "model.layers.42.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.799437066249084e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007455744780600071, + "sensitivity": 0.5349158236653042 + }, + { + "name": "model.layers.42.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006808197940699756, + "sensitivity": 0.5590007216263808 + }, + { + "name": "model.layers.42.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.248711083069793e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006570323603227735, + "sensitivity": 0.540613283934085 + }, + { + "name": "model.layers.42.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.975081512588076e-05, + "sensitivity": 0.8079915376673483 + }, + { + "name": "model.layers.42.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.318592108480516e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006532830884680152, + "sensitivity": 0.5334090483291635 + }, + { + "name": "model.layers.42.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.505313674802892e-05, + "sensitivity": 0.9799445703558334 + }, + { + "name": "model.layers.42.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.309932132353424e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006458432762883604, + "sensitivity": 0.580839833936684 + }, + { + "name": "model.layers.42.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.878613592358306e-05, + "sensitivity": 0.7419170973464261 + }, + { + "name": "model.layers.42.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.115983748917643e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006737703224644065, + "sensitivity": 0.5604943083925737 + }, + { + "name": "model.layers.42.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.76925337756984e-05, + "sensitivity": 0.8186792980416899 + }, + { + "name": "model.layers.42.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.989331945485901e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.710251909680665e-05, + "sensitivity": 0.6302750791354621 + }, + { + "name": "model.layers.42.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006861516740173101, + "sensitivity": 0.5381081705944548 + }, + { + "name": "model.layers.42.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.46274202154018e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006747896550223231, + "sensitivity": 0.528479439052234 + }, + { + "name": "model.layers.42.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.633331602439284e-05, + "sensitivity": 0.8561472585214235 + }, + { + "name": "model.layers.42.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0717322993514244e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.697547385352664e-05, + "sensitivity": 0.6197759407107952 + }, + { + "name": "model.layers.42.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.120010220911354e-05, + "sensitivity": 0.6490091656429997 + }, + { + "name": "model.layers.42.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.989336043261574e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006675642216578126, + "sensitivity": 0.5446076036128218 + }, + { + "name": "model.layers.42.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.913885590620339e-05, + "sensitivity": 0.7692744737317054 + }, + { + "name": "model.layers.42.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0495098194951424e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008000998641364276, + "sensitivity": 0.5463566442848038 + }, + { + "name": "model.layers.42.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.140126788523048e-05, + "sensitivity": 0.7101571550729641 + }, + { + "name": "model.layers.42.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1133117823192151e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006962978513911366, + "sensitivity": 0.5464407792875435 + }, + { + "name": "model.layers.42.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006499738665297627, + "sensitivity": 0.538278870914285 + }, + { + "name": "model.layers.42.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.978722240091884e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006463453755713999, + "sensitivity": 0.5414925734759536 + }, + { + "name": "model.layers.42.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006826870958320796, + "sensitivity": 0.5134715668987958 + }, + { + "name": "model.layers.42.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.437837439283612e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006878517451696098, + "sensitivity": 0.5251434920696814 + }, + { + "name": "model.layers.42.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.399252015398815e-05, + "sensitivity": 0.6742922180024105 + }, + { + "name": "model.layers.42.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.152152647904586e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.04131564614363e-05, + "sensitivity": 0.6052462072394693 + }, + { + "name": "model.layers.42.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000702015298884362, + "sensitivity": 0.5505028175948089 + }, + { + "name": "model.layers.42.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.06265313460608e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.241867959033698e-05, + "sensitivity": 0.6591178680131635 + }, + { + "name": "model.layers.42.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007171110482886434, + "sensitivity": 0.5435028697729273 + }, + { + "name": "model.layers.42.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.384289114677813e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.256959022721276e-05, + "sensitivity": 0.60003609787317 + }, + { + "name": "model.layers.42.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.5517931615249836e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.920926933962619e-06, + "sensitivity": 2.106015007032067 + }, + { + "name": "model.layers.42.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.417030140757561e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.42.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.9301337488286663e-06, + "sensitivity": 2.1098198081230874 + }, + { + "name": "model.layers.42.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 1.132014313043328e-05, + "sensitivity": 2.2457080895309347 + }, + { + "name": "model.layers.42.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.0002176280686398968, + "sensitivity": 0.793304873611195 + }, + { + "name": "model.layers.42.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.952105048985686e-05, + "sensitivity": 0.8953795962904546 + }, + { + "name": "model.layers.42.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 4.385049032862298e-05, + "sensitivity": 0.7625087755739327 + }, + { + "name": "model.layers.42.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 4, + "mse": 5.0670485506998375e-05, + "sensitivity": 1.3972905042165102 + }, + { + "name": "model.layers.43.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007602049736306071, + "sensitivity": 0.5464695601897201 + }, + { + "name": "model.layers.43.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.337433428096119e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007353726541623473, + "sensitivity": 0.5030598040757807 + }, + { + "name": "model.layers.43.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.06094254180789e-05, + "sensitivity": 0.7536802149272124 + }, + { + "name": "model.layers.43.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.38350706797064e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006896990234963596, + "sensitivity": 0.5193550616101942 + }, + { + "name": "model.layers.43.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007068581762723625, + "sensitivity": 0.5602133947865361 + }, + { + "name": "model.layers.43.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.9241302703158e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000701389042660594, + "sensitivity": 0.5321533061889326 + }, + { + "name": "model.layers.43.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.807704630773515e-05, + "sensitivity": 0.7223615614118086 + }, + { + "name": "model.layers.43.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.157438742273371e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007702443981543183, + "sensitivity": 0.5676283462769451 + }, + { + "name": "model.layers.43.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007090584840625525, + "sensitivity": 0.5413746051935067 + }, + { + "name": "model.layers.43.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.687174274906283e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.915791552979499e-05, + "sensitivity": 0.6041257305783041 + }, + { + "name": "model.layers.43.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.254221079871058e-05, + "sensitivity": 1.0066315656993803 + }, + { + "name": "model.layers.43.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.186231070794747e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006527038640342653, + "sensitivity": 0.5475471419099096 + }, + { + "name": "model.layers.43.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007160776294767857, + "sensitivity": 0.5363701662060172 + }, + { + "name": "model.layers.43.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.08540812361025e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007149602752178907, + "sensitivity": 0.5257473111849387 + }, + { + "name": "model.layers.43.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.467907223850489e-05, + "sensitivity": 0.8963638060860218 + }, + { + "name": "model.layers.43.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1171466667292407e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006646484835073352, + "sensitivity": 0.5481306627950793 + }, + { + "name": "model.layers.43.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.538357411045581e-05, + "sensitivity": 0.6059388669614247 + }, + { + "name": "model.layers.43.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.766763587824244e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007532999152317643, + "sensitivity": 0.5926591539709923 + }, + { + "name": "model.layers.43.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.741487595718354e-05, + "sensitivity": 0.6257929823890587 + }, + { + "name": "model.layers.43.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.533026516488462e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007453775033354759, + "sensitivity": 0.5379135006676337 + }, + { + "name": "model.layers.43.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.10342831350863e-05, + "sensitivity": 0.6558643182353636 + }, + { + "name": "model.layers.43.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1285287655482534e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.17396435700357e-05, + "sensitivity": 0.6386070806799791 + }, + { + "name": "model.layers.43.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.862269947305322e-05, + "sensitivity": 0.9213451491653574 + }, + { + "name": "model.layers.43.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.445901246683206e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007488647825084627, + "sensitivity": 0.5537965448976867 + }, + { + "name": "model.layers.43.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.161590863484889e-05, + "sensitivity": 0.9972387017984927 + }, + { + "name": "model.layers.43.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.472339002059016e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006629893905483186, + "sensitivity": 0.5376378700670619 + }, + { + "name": "model.layers.43.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007105680997483432, + "sensitivity": 0.5653131069497036 + }, + { + "name": "model.layers.43.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.97127427176747e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007281664293259382, + "sensitivity": 0.550759062377212 + }, + { + "name": "model.layers.43.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006981519982218742, + "sensitivity": 0.5604057494663626 + }, + { + "name": "model.layers.43.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.401133868574107e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006430709036067128, + "sensitivity": 0.5242284841051603 + }, + { + "name": "model.layers.43.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1568177797016688e-05, + "sensitivity": 1.368843722965875 + }, + { + "name": "model.layers.43.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0594793593554641e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.30366412224248e-05, + "sensitivity": 0.8832817933457103 + }, + { + "name": "model.layers.43.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007135483319871128, + "sensitivity": 0.5793563839924372 + }, + { + "name": "model.layers.43.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5430555322382133e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.6403452617814764e-05, + "sensitivity": 0.6305334829982305 + }, + { + "name": "model.layers.43.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.449005741160363e-05, + "sensitivity": 0.7602857496220393 + }, + { + "name": "model.layers.43.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.3833094928704668e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.8849436754826456e-05, + "sensitivity": 0.6839798995671371 + }, + { + "name": "model.layers.43.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007157976506277919, + "sensitivity": 0.5644498181291174 + }, + { + "name": "model.layers.43.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.924401757009036e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007478293846361339, + "sensitivity": 0.5141644954489499 + }, + { + "name": "model.layers.43.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.356634548865259e-05, + "sensitivity": 1.0135940340382508 + }, + { + "name": "model.layers.43.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.50205992719566e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.630555435549468e-05, + "sensitivity": 1.0000241133330823 + }, + { + "name": "model.layers.43.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007199060055427253, + "sensitivity": 0.5133961017423346 + }, + { + "name": "model.layers.43.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.769479909962683e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007056538015604019, + "sensitivity": 0.5156803968734944 + }, + { + "name": "model.layers.43.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.446917541325092e-05, + "sensitivity": 0.6237774514059087 + }, + { + "name": "model.layers.43.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.29873897600919e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007185357389971614, + "sensitivity": 0.55331479741186 + }, + { + "name": "model.layers.43.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007423778297379613, + "sensitivity": 0.5525429887297905 + }, + { + "name": "model.layers.43.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.333818186656572e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.267482240218669e-05, + "sensitivity": 0.6626891424340376 + }, + { + "name": "model.layers.43.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.289585144259036e-05, + "sensitivity": 0.8619085733716331 + }, + { + "name": "model.layers.43.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0510084393899888e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007167309522628784, + "sensitivity": 0.5487098095314373 + }, + { + "name": "model.layers.43.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007487088441848755, + "sensitivity": 0.5273298041748221 + }, + { + "name": "model.layers.43.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.974442380349501e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007033213041722775, + "sensitivity": 0.56133777505148 + }, + { + "name": "model.layers.43.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.918281724210829e-05, + "sensitivity": 0.9371596289247276 + }, + { + "name": "model.layers.43.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.176014827971812e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007960271905176342, + "sensitivity": 0.5845027696843041 + }, + { + "name": "model.layers.43.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.557175220223144e-05, + "sensitivity": 0.977231869711168 + }, + { + "name": "model.layers.43.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0550286333455006e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007197223603725433, + "sensitivity": 0.5806954006599391 + }, + { + "name": "model.layers.43.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.395734817488119e-05, + "sensitivity": 0.6771258165153251 + }, + { + "name": "model.layers.43.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.752344342610741e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007044849917292595, + "sensitivity": 0.5337903101258101 + }, + { + "name": "model.layers.43.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.672403105767444e-05, + "sensitivity": 0.6863695297004222 + }, + { + "name": "model.layers.43.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.103785719664302e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007481633219867945, + "sensitivity": 0.5669404839287818 + }, + { + "name": "model.layers.43.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.53538154438138e-05, + "sensitivity": 0.8721769667000383 + }, + { + "name": "model.layers.43.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.656571364757838e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007436113664880395, + "sensitivity": 0.5354187274845696 + }, + { + "name": "model.layers.43.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1031595022359397e-05, + "sensitivity": 1.2329938096450408 + }, + { + "name": "model.layers.43.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2726829936582362e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5851705837994814e-05, + "sensitivity": 0.9368064274905104 + }, + { + "name": "model.layers.43.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.8756872022058815e-05, + "sensitivity": 0.760092770990358 + }, + { + "name": "model.layers.43.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.380410238511104e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006733516929671168, + "sensitivity": 0.5587930697067868 + }, + { + "name": "model.layers.43.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.370192568283528e-05, + "sensitivity": 0.665298239345866 + }, + { + "name": "model.layers.43.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.083666441256355e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006640083156526089, + "sensitivity": 0.5822587982449973 + }, + { + "name": "model.layers.43.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.089695307309739e-05, + "sensitivity": 0.7528875012174574 + }, + { + "name": "model.layers.43.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.079621238721302e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006406238535419106, + "sensitivity": 0.5239892271278668 + }, + { + "name": "model.layers.43.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007680892013013363, + "sensitivity": 0.5543853898771702 + }, + { + "name": "model.layers.43.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.038042551561375e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007518132915720344, + "sensitivity": 0.5432214482838585 + }, + { + "name": "model.layers.43.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.898112431168556e-05, + "sensitivity": 0.6077859135103809 + }, + { + "name": "model.layers.43.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.517292033298872e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006474503315985203, + "sensitivity": 0.542046016694562 + }, + { + "name": "model.layers.43.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.130761903477833e-05, + "sensitivity": 0.6749887462028362 + }, + { + "name": "model.layers.43.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.376518169621704e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006975022843107581, + "sensitivity": 0.5608508737946268 + }, + { + "name": "model.layers.43.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.67184212943539e-05, + "sensitivity": 0.9606530548764715 + }, + { + "name": "model.layers.43.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0551210607445682e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.722871330566704e-05, + "sensitivity": 0.6360530259105807 + }, + { + "name": "model.layers.43.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.94753834977746e-05, + "sensitivity": 0.6452400470852713 + }, + { + "name": "model.layers.43.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.9766118687985e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007584846462123096, + "sensitivity": 0.5780167030969342 + }, + { + "name": "model.layers.43.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.949484693701379e-05, + "sensitivity": 0.614501102444877 + }, + { + "name": "model.layers.43.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1742238257284043e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.190763087943196e-05, + "sensitivity": 0.7541452833791258 + }, + { + "name": "model.layers.43.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.644753739237785e-05, + "sensitivity": 0.7484106990285906 + }, + { + "name": "model.layers.43.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.796037829801207e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007211086340248585, + "sensitivity": 0.5492890827850987 + }, + { + "name": "model.layers.43.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.0088332247687504e-05, + "sensitivity": 0.8724219081115563 + }, + { + "name": "model.layers.43.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.704984798489022e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.9934693126706406e-05, + "sensitivity": 0.6958862903906574 + }, + { + "name": "model.layers.43.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.563553324667737e-05, + "sensitivity": 0.666849751617395 + }, + { + "name": "model.layers.43.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4452897403316456e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007203572895377874, + "sensitivity": 0.5886464198280477 + }, + { + "name": "model.layers.43.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007292439695447683, + "sensitivity": 0.5598409669710303 + }, + { + "name": "model.layers.43.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.565109854112961e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006779240211471915, + "sensitivity": 0.5586268013533522 + }, + { + "name": "model.layers.43.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.347454473143443e-05, + "sensitivity": 0.677598079556423 + }, + { + "name": "model.layers.43.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.626396604289766e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.47109845886007e-05, + "sensitivity": 0.8458524243818664 + }, + { + "name": "model.layers.43.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006744525162503123, + "sensitivity": 0.5378248049130053 + }, + { + "name": "model.layers.43.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.473017262782378e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006802569841966033, + "sensitivity": 0.54822643097021 + }, + { + "name": "model.layers.43.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.900752148590982e-05, + "sensitivity": 0.8534019043796697 + }, + { + "name": "model.layers.43.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.323776571865892e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006593801081180573, + "sensitivity": 0.5697479580638655 + }, + { + "name": "model.layers.43.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.608199328184128e-05, + "sensitivity": 0.6235961677281738 + }, + { + "name": "model.layers.43.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.617358844276168e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000712305773049593, + "sensitivity": 0.5749446144309999 + }, + { + "name": "model.layers.43.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007140818051993847, + "sensitivity": 0.5451863119884042 + }, + { + "name": "model.layers.43.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.106591735668189e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006562676280736923, + "sensitivity": 0.5290953336154 + }, + { + "name": "model.layers.43.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006725781131535769, + "sensitivity": 0.5294181122957213 + }, + { + "name": "model.layers.43.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.401941269970848e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006057674763724208, + "sensitivity": 0.5383045994928395 + }, + { + "name": "model.layers.43.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007404013886116445, + "sensitivity": 0.573422582499427 + }, + { + "name": "model.layers.43.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.434894536752836e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006949108792468905, + "sensitivity": 0.5230779957151239 + }, + { + "name": "model.layers.43.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007323437603190541, + "sensitivity": 0.555107056432431 + }, + { + "name": "model.layers.43.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.726052331236133e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006916522397659719, + "sensitivity": 0.5310334142519224 + }, + { + "name": "model.layers.43.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.631897849729285e-05, + "sensitivity": 0.8954178522868191 + }, + { + "name": "model.layers.43.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.006475920614321e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.788840983062983e-05, + "sensitivity": 0.6576159871176783 + }, + { + "name": "model.layers.43.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.4978074331302196e-05, + "sensitivity": 0.7324365225999765 + }, + { + "name": "model.layers.43.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.090043479569431e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.5197328038048e-05, + "sensitivity": 0.7332859313985554 + }, + { + "name": "model.layers.43.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000706388265825808, + "sensitivity": 0.5852038501196448 + }, + { + "name": "model.layers.43.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.316391474887496e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000722581404261291, + "sensitivity": 0.5585825295713616 + }, + { + "name": "model.layers.43.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.362442945828661e-05, + "sensitivity": 0.7305398921976136 + }, + { + "name": "model.layers.43.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 6.733836812600202e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006913202814757824, + "sensitivity": 0.5271714962386383 + }, + { + "name": "model.layers.43.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.350209878291935e-05, + "sensitivity": 0.87788511650309 + }, + { + "name": "model.layers.43.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.174170847662026e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006966536748223007, + "sensitivity": 0.5218709503987016 + }, + { + "name": "model.layers.43.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000765431672334671, + "sensitivity": 0.5334983724962531 + }, + { + "name": "model.layers.43.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.464427653758321e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007559815421700478, + "sensitivity": 0.5192682092150792 + }, + { + "name": "model.layers.43.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.75679839332588e-05, + "sensitivity": 0.7006577170516504 + }, + { + "name": "model.layers.43.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.118143018175033e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.555086292792112e-05, + "sensitivity": 0.6240497560298713 + }, + { + "name": "model.layers.43.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006942005711607635, + "sensitivity": 0.5420111151428778 + }, + { + "name": "model.layers.43.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.888038453529589e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006458614952862263, + "sensitivity": 0.5297045682315391 + }, + { + "name": "model.layers.43.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.3777238311595283e-06, + "sensitivity": 2.097584030602833 + }, + { + "name": "model.layers.43.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.569267831466277e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006334905629046261, + "sensitivity": 0.563786487693265 + }, + { + "name": "model.layers.43.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.464107718784362e-05, + "sensitivity": 0.638451447858533 + }, + { + "name": "model.layers.43.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.205649351111788e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.2693803000729531e-05, + "sensitivity": 1.6068223093561085 + }, + { + "name": "model.layers.43.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 5.739050538977608e-05, + "sensitivity": 0.7349403502664091 + }, + { + "name": "model.layers.43.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.775734497452504e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.775667887064628e-05, + "sensitivity": 0.7023051144554664 + }, + { + "name": "model.layers.43.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000741225085221231, + "sensitivity": 0.556129578364327 + }, + { + "name": "model.layers.43.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.10547612420487e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007108502904884517, + "sensitivity": 0.5593631462931187 + }, + { + "name": "model.layers.43.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.506847752352769e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.968503738680738e-06, + "sensitivity": 2.106978125585001 + }, + { + "name": "model.layers.43.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.185621037322562e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.43.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.6698617173460661e-06, + "sensitivity": 2.1092339103152766 + }, + { + "name": "model.layers.43.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 1.0488554835319519e-05, + "sensitivity": 2.202904940453286 + }, + { + "name": "model.layers.43.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00016809572116471827, + "sensitivity": 0.8038724217385219 + }, + { + "name": "model.layers.43.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.555923154228367e-05, + "sensitivity": 0.9683457971495986 + }, + { + "name": "model.layers.43.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 5.392429739004001e-05, + "sensitivity": 0.668693971450738 + }, + { + "name": "model.layers.43.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00025356863625347614, + "sensitivity": 1.009493891432195 + }, + { + "name": "model.layers.44.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.721816316712648e-05, + "sensitivity": 0.6505045782807755 + }, + { + "name": "model.layers.44.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1029678717022762e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007438661414198577, + "sensitivity": 0.5528240209637193 + }, + { + "name": "model.layers.44.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007144473493099213, + "sensitivity": 0.5701729083047802 + }, + { + "name": "model.layers.44.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.028917702380568e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006599724292755127, + "sensitivity": 0.5508535517750209 + }, + { + "name": "model.layers.44.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.275554187595844e-05, + "sensitivity": 0.7965469779046492 + }, + { + "name": "model.layers.44.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2340412922640098e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006909950170665979, + "sensitivity": 0.5429912236380408 + }, + { + "name": "model.layers.44.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.396927346941084e-05, + "sensitivity": 0.8464221986356608 + }, + { + "name": "model.layers.44.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0305855084880022e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.227615813259035e-05, + "sensitivity": 0.6994166848156405 + }, + { + "name": "model.layers.44.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.244799053296447e-05, + "sensitivity": 0.6328697845871003 + }, + { + "name": "model.layers.44.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0389820772616076e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007791281677782536, + "sensitivity": 0.5419851668230082 + }, + { + "name": "model.layers.44.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.718221993651241e-05, + "sensitivity": 0.6893933567250712 + }, + { + "name": "model.layers.44.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.825123490561964e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.26677501713857e-05, + "sensitivity": 0.6942670243191869 + }, + { + "name": "model.layers.44.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.690894952043891e-05, + "sensitivity": 0.6421432807357237 + }, + { + "name": "model.layers.44.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.83415930022602e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.585029041161761e-05, + "sensitivity": 0.7138820151704328 + }, + { + "name": "model.layers.44.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.131193367764354e-05, + "sensitivity": 0.8956350050427091 + }, + { + "name": "model.layers.44.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.938841690702247e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.374392978614196e-05, + "sensitivity": 0.7058329270962431 + }, + { + "name": "model.layers.44.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.62103047943674e-05, + "sensitivity": 0.6780547557006654 + }, + { + "name": "model.layers.44.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0438496929054963e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007035140879452229, + "sensitivity": 0.545724195044324 + }, + { + "name": "model.layers.44.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.296667172340676e-05, + "sensitivity": 0.6396863835826716 + }, + { + "name": "model.layers.44.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3356568615563447e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.750059012323618e-05, + "sensitivity": 0.7308081306298588 + }, + { + "name": "model.layers.44.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007417883607558906, + "sensitivity": 0.5629377230059469 + }, + { + "name": "model.layers.44.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.256982937382418e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007479933556169271, + "sensitivity": 0.570133311496095 + }, + { + "name": "model.layers.44.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.767684681108221e-05, + "sensitivity": 0.8370400600689242 + }, + { + "name": "model.layers.44.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.204756341001485e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007816435536369681, + "sensitivity": 0.5120982723945207 + }, + { + "name": "model.layers.44.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.736988143529743e-05, + "sensitivity": 0.7336668493115764 + }, + { + "name": "model.layers.44.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.598043450547266e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007070849533192813, + "sensitivity": 0.5415163549213791 + }, + { + "name": "model.layers.44.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000742375326808542, + "sensitivity": 0.5500435236039959 + }, + { + "name": "model.layers.44.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.237159019903629e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.0894131264649332e-05, + "sensitivity": 1.2313641412289567 + }, + { + "name": "model.layers.44.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007257721154019237, + "sensitivity": 0.5585499546946778 + }, + { + "name": "model.layers.44.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0495266451471252e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006369700422510505, + "sensitivity": 0.5315488151272333 + }, + { + "name": "model.layers.44.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.335852958727628e-05, + "sensitivity": 0.9795409413602131 + }, + { + "name": "model.layers.44.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.144749810729991e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.478999810293317e-05, + "sensitivity": 0.6204275631611504 + }, + { + "name": "model.layers.44.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007830878021195531, + "sensitivity": 0.5738799422054301 + }, + { + "name": "model.layers.44.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.848172339843586e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007468642434105277, + "sensitivity": 0.5544485076594444 + }, + { + "name": "model.layers.44.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.627313996432349e-05, + "sensitivity": 0.644105959870115 + }, + { + "name": "model.layers.44.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0271305654896423e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007289930945262313, + "sensitivity": 0.5607562404609312 + }, + { + "name": "model.layers.44.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007721954025328159, + "sensitivity": 0.5515908613157806 + }, + { + "name": "model.layers.44.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.196650694320851e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.806873716413975e-05, + "sensitivity": 0.929522369090714 + }, + { + "name": "model.layers.44.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007949993014335632, + "sensitivity": 0.5275871646033481 + }, + { + "name": "model.layers.44.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.124289590545231e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.654994649579749e-05, + "sensitivity": 0.6430819425206679 + }, + { + "name": "model.layers.44.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.59229772281833e-05, + "sensitivity": 0.8316662776799173 + }, + { + "name": "model.layers.44.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.386949505416851e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.39895151834935e-05, + "sensitivity": 0.794329836304621 + }, + { + "name": "model.layers.44.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.436893454520032e-05, + "sensitivity": 0.6926282960702193 + }, + { + "name": "model.layers.44.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.123044269974343e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.403076986316592e-05, + "sensitivity": 0.7188266014676616 + }, + { + "name": "model.layers.44.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.547794328071177e-05, + "sensitivity": 0.8792033007484185 + }, + { + "name": "model.layers.44.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.716622242995072e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.850815796293318e-05, + "sensitivity": 0.7872208996920464 + }, + { + "name": "model.layers.44.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000717272749170661, + "sensitivity": 0.5382125644648024 + }, + { + "name": "model.layers.44.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.935664368436846e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.846089334227145e-05, + "sensitivity": 0.625244599403306 + }, + { + "name": "model.layers.44.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007473204168491066, + "sensitivity": 0.5239279682561628 + }, + { + "name": "model.layers.44.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.998266250477172e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.158660835353658e-05, + "sensitivity": 0.6388151685842007 + }, + { + "name": "model.layers.44.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007195104262791574, + "sensitivity": 0.5813269898479484 + }, + { + "name": "model.layers.44.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.692317692293727e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.233198655536398e-05, + "sensitivity": 0.6495061395144904 + }, + { + "name": "model.layers.44.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007596053183078766, + "sensitivity": 0.5453670883295056 + }, + { + "name": "model.layers.44.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.818534524834831e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007286019972525537, + "sensitivity": 0.5572768678515188 + }, + { + "name": "model.layers.44.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008138448465615511, + "sensitivity": 0.5679372511871077 + }, + { + "name": "model.layers.44.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.475268143432913e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007643378339707851, + "sensitivity": 0.5404592159465169 + }, + { + "name": "model.layers.44.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.257896929018898e-05, + "sensitivity": 1.219219530878525 + }, + { + "name": "model.layers.44.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0628253903632867e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.543216295540333e-05, + "sensitivity": 0.6299688014563213 + }, + { + "name": "model.layers.44.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008144670864567161, + "sensitivity": 0.5988046616131331 + }, + { + "name": "model.layers.44.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2030363905068953e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007409557001665235, + "sensitivity": 0.5538817924914536 + }, + { + "name": "model.layers.44.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007529780268669128, + "sensitivity": 0.5540609948291979 + }, + { + "name": "model.layers.44.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0041035238828044e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006747780134901404, + "sensitivity": 0.5362102247348453 + }, + { + "name": "model.layers.44.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007039912743493915, + "sensitivity": 0.5944380168765397 + }, + { + "name": "model.layers.44.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0169318329644739e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006306021241471171, + "sensitivity": 0.5685900808691268 + }, + { + "name": "model.layers.44.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.590255361516029e-05, + "sensitivity": 0.6908208112646494 + }, + { + "name": "model.layers.44.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2492989753809525e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006820781854912639, + "sensitivity": 0.5483611966661613 + }, + { + "name": "model.layers.44.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.79271761327982e-05, + "sensitivity": 0.7945173531893566 + }, + { + "name": "model.layers.44.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.816491572360974e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007297940319404006, + "sensitivity": 0.525159262570055 + }, + { + "name": "model.layers.44.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007416746811941266, + "sensitivity": 0.5236726085323328 + }, + { + "name": "model.layers.44.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.264289246857516e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006893199752084911, + "sensitivity": 0.5369244686755701 + }, + { + "name": "model.layers.44.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.791971827624366e-05, + "sensitivity": 0.620601214677712 + }, + { + "name": "model.layers.44.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8975600823978311e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.996325853629969e-05, + "sensitivity": 0.7122061538959272 + }, + { + "name": "model.layers.44.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1525788977451157e-05, + "sensitivity": 1.2216221990266511 + }, + { + "name": "model.layers.44.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.102799367610714e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.466695049311966e-05, + "sensitivity": 0.674915975999408 + }, + { + "name": "model.layers.44.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007429630495607853, + "sensitivity": 0.5398022010981032 + }, + { + "name": "model.layers.44.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.316346793435514e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006879197317175567, + "sensitivity": 0.5374090369337753 + }, + { + "name": "model.layers.44.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008313389262184501, + "sensitivity": 0.5472672984432546 + }, + { + "name": "model.layers.44.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.031737135956064e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008202940225601196, + "sensitivity": 0.570002736123001 + }, + { + "name": "model.layers.44.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.603166548302397e-05, + "sensitivity": 0.7076216491883703 + }, + { + "name": "model.layers.44.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0680746527214069e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.698216020595282e-05, + "sensitivity": 0.7603605918216456 + }, + { + "name": "model.layers.44.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.696420314256102e-05, + "sensitivity": 0.8281837761046184 + }, + { + "name": "model.layers.44.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.500386456944398e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007019552285782993, + "sensitivity": 0.5453882254926399 + }, + { + "name": "model.layers.44.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.251256465679035e-05, + "sensitivity": 1.1647941312434615 + }, + { + "name": "model.layers.44.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0579399258858757e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.354296394623816e-05, + "sensitivity": 0.7743960439881242 + }, + { + "name": "model.layers.44.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007645798614248633, + "sensitivity": 0.560114160855434 + }, + { + "name": "model.layers.44.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.501494560026913e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007166076684370637, + "sensitivity": 0.5613524237335158 + }, + { + "name": "model.layers.44.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.249680154724047e-05, + "sensitivity": 0.7720597356644348 + }, + { + "name": "model.layers.44.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.280718131776666e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.34316893410869e-05, + "sensitivity": 0.6911628631263855 + }, + { + "name": "model.layers.44.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.266632746905088e-05, + "sensitivity": 0.6300447885097535 + }, + { + "name": "model.layers.44.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.653244887886103e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.816141442162916e-05, + "sensitivity": 0.6540185411302251 + }, + { + "name": "model.layers.44.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.343649874906987e-05, + "sensitivity": 0.7140350396577568 + }, + { + "name": "model.layers.44.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.245166327469633e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006859024288132787, + "sensitivity": 0.5891826090574122 + }, + { + "name": "model.layers.44.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007456468301825225, + "sensitivity": 0.5791775445499563 + }, + { + "name": "model.layers.44.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.04443970991997e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007078940980136395, + "sensitivity": 0.542839422243419 + }, + { + "name": "model.layers.44.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007623056881129742, + "sensitivity": 0.5381048850190859 + }, + { + "name": "model.layers.44.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0540120456425939e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.231208681128919e-05, + "sensitivity": 0.6364689744329334 + }, + { + "name": "model.layers.44.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007214054930955172, + "sensitivity": 0.5311143484002249 + }, + { + "name": "model.layers.44.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.663720905133232e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006334614008665085, + "sensitivity": 0.5333600968004883 + }, + { + "name": "model.layers.44.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000753675471059978, + "sensitivity": 0.5961642569228527 + }, + { + "name": "model.layers.44.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1277958265054622e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.528384983539581e-05, + "sensitivity": 0.6755461818455213 + }, + { + "name": "model.layers.44.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.45841971365735e-05, + "sensitivity": 0.6608783117646649 + }, + { + "name": "model.layers.44.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0698666983444127e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007934842724353075, + "sensitivity": 0.5702038100252409 + }, + { + "name": "model.layers.44.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007586389547213912, + "sensitivity": 0.5191057090665521 + }, + { + "name": "model.layers.44.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.136217613558983e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006996816955506802, + "sensitivity": 0.5844370328889706 + }, + { + "name": "model.layers.44.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.812562060076743e-05, + "sensitivity": 0.8555029725419618 + }, + { + "name": "model.layers.44.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1075313750552596e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007150328601710498, + "sensitivity": 0.5271277172261417 + }, + { + "name": "model.layers.44.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007386220386251807, + "sensitivity": 0.518742872844671 + }, + { + "name": "model.layers.44.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.743199941818602e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006678660283796489, + "sensitivity": 0.5461431301202322 + }, + { + "name": "model.layers.44.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.294927152339369e-05, + "sensitivity": 0.818410091139163 + }, + { + "name": "model.layers.44.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.467365321645048e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006704164552502334, + "sensitivity": 0.5619190397834481 + }, + { + "name": "model.layers.44.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007445893133990467, + "sensitivity": 0.5834456394067822 + }, + { + "name": "model.layers.44.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.524103481642669e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.989665805827826e-05, + "sensitivity": 0.9110527778662919 + }, + { + "name": "model.layers.44.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.756022048648447e-05, + "sensitivity": 0.7561394837321828 + }, + { + "name": "model.layers.44.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 7.643997719242179e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007632838096469641, + "sensitivity": 0.52548852253232 + }, + { + "name": "model.layers.44.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.094675675034523e-05, + "sensitivity": 0.8177387659972656 + }, + { + "name": "model.layers.44.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0698515779949958e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.745149585185573e-05, + "sensitivity": 0.7171505418639965 + }, + { + "name": "model.layers.44.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.273128721863031e-05, + "sensitivity": 1.0896686426673539 + }, + { + "name": "model.layers.44.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.637275772736757e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.2088055882486515e-05, + "sensitivity": 1.2219474915583042 + }, + { + "name": "model.layers.44.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.350595504045486e-05, + "sensitivity": 0.6535044166260798 + }, + { + "name": "model.layers.44.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2775096820405452e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.259721703827381e-05, + "sensitivity": 0.7063881307457813 + }, + { + "name": "model.layers.44.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0006969644455239177, + "sensitivity": 0.520083351943519 + }, + { + "name": "model.layers.44.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.637068162897776e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0006544226198457181, + "sensitivity": 0.5253550249067844 + }, + { + "name": "model.layers.44.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007302109152078629, + "sensitivity": 0.5881302104037117 + }, + { + "name": "model.layers.44.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.314170483776252e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.715731458622031e-05, + "sensitivity": 0.641668817816082 + }, + { + "name": "model.layers.44.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.1670270396280102e-05, + "sensitivity": 1.3064555404147842 + }, + { + "name": "model.layers.44.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2756634077959461e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.984999006614089e-05, + "sensitivity": 0.6487234972604823 + }, + { + "name": "model.layers.44.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.239545084303245e-05, + "sensitivity": 0.8995384246782281 + }, + { + "name": "model.layers.44.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3915672525399714e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007861024932935834, + "sensitivity": 0.5852179650140402 + }, + { + "name": "model.layers.44.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.3930941804574104e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.4206801779437228e-06, + "sensitivity": 2.109324169447973 + }, + { + "name": "model.layers.44.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.071534931426868e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.44.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 1.8237462882098043e-06, + "sensitivity": 2.109686841069944 + }, + { + "name": "model.layers.44.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 8.779413292359095e-06, + "sensitivity": 2.199125208609128 + }, + { + "name": "model.layers.44.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00021412920614238828, + "sensitivity": 0.8263706462301548 + }, + { + "name": "model.layers.44.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 2.0100136680412106e-05, + "sensitivity": 1.0268966674290965 + }, + { + "name": "model.layers.44.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 4.4510372390504926e-05, + "sensitivity": 0.7496715369361794 + }, + { + "name": "model.layers.44.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 3, + "mse": 0.00029851519502699375, + "sensitivity": 1.055959375796814 + }, + { + "name": "model.layers.45.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008600009023211896, + "sensitivity": 0.5435860710160527 + }, + { + "name": "model.layers.45.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.046729587680602e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000743160373531282, + "sensitivity": 0.5506728871783448 + }, + { + "name": "model.layers.45.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.024513615760952e-05, + "sensitivity": 1.1540542245304195 + }, + { + "name": "model.layers.45.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3937427638666122e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.747378938598558e-05, + "sensitivity": 1.0022106468755 + }, + { + "name": "model.layers.45.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.948078564368188e-05, + "sensitivity": 0.65736489895252 + }, + { + "name": "model.layers.45.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0747853593784384e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.615039794472978e-05, + "sensitivity": 1.1840304800767387 + }, + { + "name": "model.layers.45.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.882092904765159e-05, + "sensitivity": 0.607888938247712 + }, + { + "name": "model.layers.45.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4761275224373094e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.807036697864532e-05, + "sensitivity": 0.6419111823366458 + }, + { + "name": "model.layers.45.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.179785461630672e-05, + "sensitivity": 0.8791290221728143 + }, + { + "name": "model.layers.45.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.53728999775194e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.576157466042787e-05, + "sensitivity": 1.0350647001931104 + }, + { + "name": "model.layers.45.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008505347068421543, + "sensitivity": 0.5203128684251301 + }, + { + "name": "model.layers.45.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1934038184335805e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007341510499827564, + "sensitivity": 0.5917580637720207 + }, + { + "name": "model.layers.45.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008646544883958995, + "sensitivity": 0.549273239592306 + }, + { + "name": "model.layers.45.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.0447553197300294e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.628358096349984e-05, + "sensitivity": 0.7193673270288038 + }, + { + "name": "model.layers.45.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.52217456465587e-05, + "sensitivity": 0.832713581063116 + }, + { + "name": "model.layers.45.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.7663485323282657e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.315495506394655e-05, + "sensitivity": 0.834350547174187 + }, + { + "name": "model.layers.45.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008097131503745914, + "sensitivity": 0.5447011490242103 + }, + { + "name": "model.layers.45.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0236424259346677e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007172293844632804, + "sensitivity": 0.5842466440308783 + }, + { + "name": "model.layers.45.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008094538934528828, + "sensitivity": 0.5482884710447236 + }, + { + "name": "model.layers.45.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0045630460808752e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 5.606769991572946e-05, + "sensitivity": 0.6200274908383099 + }, + { + "name": "model.layers.45.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 8.146620530169457e-05, + "sensitivity": 0.7268170078544545 + }, + { + "name": "model.layers.45.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4117216551312595e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.241707109846175e-05, + "sensitivity": 0.7522055690562526 + }, + { + "name": "model.layers.45.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.4123094842943829e-05, + "sensitivity": 1.4735931765425454 + }, + { + "name": "model.layers.45.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4088473108131438e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.931531243026257e-05, + "sensitivity": 1.0630676238422683 + }, + { + "name": "model.layers.45.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 8.087315654847771e-05, + "sensitivity": 1.1638864973176737 + }, + { + "name": "model.layers.45.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2484970284276642e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.995428702794015e-05, + "sensitivity": 0.6666885803855858 + }, + { + "name": "model.layers.45.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0009171671117655933, + "sensitivity": 0.5847369702657312 + }, + { + "name": "model.layers.45.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.815205430641072e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.384286436717957e-05, + "sensitivity": 0.7972932179652155 + }, + { + "name": "model.layers.45.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0009095397545024753, + "sensitivity": 0.5740220731407834 + }, + { + "name": "model.layers.45.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1650809028651565e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.679140253458172e-05, + "sensitivity": 0.7787535867250746 + }, + { + "name": "model.layers.45.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 8.002850518096238e-05, + "sensitivity": 0.6098539326450604 + }, + { + "name": "model.layers.45.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.750546041686903e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008328684489242733, + "sensitivity": 0.5995219646601182 + }, + { + "name": "model.layers.45.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0009044675971381366, + "sensitivity": 0.5354644805419131 + }, + { + "name": "model.layers.45.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0524157687541447e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008785586105659604, + "sensitivity": 0.5995457089863592 + }, + { + "name": "model.layers.45.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.95809319242835e-05, + "sensitivity": 0.602592473754132 + }, + { + "name": "model.layers.45.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1103860515504493e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.494816236430779e-05, + "sensitivity": 0.6465268142636209 + }, + { + "name": "model.layers.45.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008715951698832214, + "sensitivity": 0.5560060637628348 + }, + { + "name": "model.layers.45.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.7979626818487304e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007868236862123013, + "sensitivity": 0.5655758646821407 + }, + { + "name": "model.layers.45.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.304440077859908e-05, + "sensitivity": 0.9320252594344762 + }, + { + "name": "model.layers.45.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0239521088806214e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.879839929752052e-05, + "sensitivity": 0.9652409338553909 + }, + { + "name": "model.layers.45.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000919818296097219, + "sensitivity": 0.5554920072441601 + }, + { + "name": "model.layers.45.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2060945664416067e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008803682285360992, + "sensitivity": 0.5513065051055324 + }, + { + "name": "model.layers.45.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.581223326269537e-05, + "sensitivity": 0.6335120448350059 + }, + { + "name": "model.layers.45.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2763775885105133e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.028868276393041e-05, + "sensitivity": 0.7125139518317568 + }, + { + "name": "model.layers.45.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.597616058774292e-05, + "sensitivity": 0.6395563474129953 + }, + { + "name": "model.layers.45.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4403524346562335e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.756697985110804e-05, + "sensitivity": 0.8842266949559046 + }, + { + "name": "model.layers.45.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008727246895432472, + "sensitivity": 0.5620232534408834 + }, + { + "name": "model.layers.45.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0517534292375785e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.450472574215382e-05, + "sensitivity": 0.7217371036056702 + }, + { + "name": "model.layers.45.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008798248018138111, + "sensitivity": 0.5486489822778139 + }, + { + "name": "model.layers.45.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1122886007797206e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.612383731408045e-05, + "sensitivity": 0.6152507051274791 + }, + { + "name": "model.layers.45.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008623792673461139, + "sensitivity": 0.5581546407592876 + }, + { + "name": "model.layers.45.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.575137482897844e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.101475785020739e-05, + "sensitivity": 0.6139406791663458 + }, + { + "name": "model.layers.45.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000856596976518631, + "sensitivity": 0.5436020591007983 + }, + { + "name": "model.layers.45.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0080069614559761e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.015408482402563e-05, + "sensitivity": 0.7915416014956301 + }, + { + "name": "model.layers.45.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.53757412894629e-05, + "sensitivity": 0.744623582736799 + }, + { + "name": "model.layers.45.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2846370509578264e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.957879668334499e-05, + "sensitivity": 0.6233761042501029 + }, + { + "name": "model.layers.45.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007994830375537276, + "sensitivity": 0.5615007742590838 + }, + { + "name": "model.layers.45.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1242632353969384e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.1666200407489669e-05, + "sensitivity": 1.314444718647411 + }, + { + "name": "model.layers.45.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008593471138738096, + "sensitivity": 0.5524806825242047 + }, + { + "name": "model.layers.45.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.392069273417292e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008339385385625064, + "sensitivity": 0.595661811184303 + }, + { + "name": "model.layers.45.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000833032769151032, + "sensitivity": 0.537004883534392 + }, + { + "name": "model.layers.45.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0002278258980368e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007419927860610187, + "sensitivity": 0.568868829604811 + }, + { + "name": "model.layers.45.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.707197073614225e-05, + "sensitivity": 0.7863390107230465 + }, + { + "name": "model.layers.45.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.7770371414371766e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008123075822368264, + "sensitivity": 0.5734454764030495 + }, + { + "name": "model.layers.45.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008495566435158253, + "sensitivity": 0.5838700618537951 + }, + { + "name": "model.layers.45.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0017761269409675e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.460231088567525e-05, + "sensitivity": 0.6396176944263368 + }, + { + "name": "model.layers.45.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.3489179764292203e-05, + "sensitivity": 1.3491291572207988 + }, + { + "name": "model.layers.45.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3763418564849417e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.4518842363031581e-05, + "sensitivity": 1.638372254932843 + }, + { + "name": "model.layers.45.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007727860938757658, + "sensitivity": 0.5824213722269633 + }, + { + "name": "model.layers.45.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2392486041790107e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.0481845139293e-05, + "sensitivity": 0.6221593449538874 + }, + { + "name": "model.layers.45.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 8.640624582767487e-05, + "sensitivity": 0.7051051115473276 + }, + { + "name": "model.layers.45.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.339798927801894e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.220498420996591e-05, + "sensitivity": 0.6361243893088147 + }, + { + "name": "model.layers.45.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.59319809731096e-05, + "sensitivity": 0.7761376782442868 + }, + { + "name": "model.layers.45.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0184974144067382e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007923810044303536, + "sensitivity": 0.5566104328088077 + }, + { + "name": "model.layers.45.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.591672328999266e-05, + "sensitivity": 0.7289159421644413 + }, + { + "name": "model.layers.45.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.117852207244141e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007684823940508068, + "sensitivity": 0.5969862758303993 + }, + { + "name": "model.layers.45.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 8.016926585696638e-05, + "sensitivity": 0.8013085699725335 + }, + { + "name": "model.layers.45.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.9497763332765317e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.70556871430017e-05, + "sensitivity": 0.6255811217894212 + }, + { + "name": "model.layers.45.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 8.820625953376293e-05, + "sensitivity": 0.7689361292278383 + }, + { + "name": "model.layers.45.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.50554785705026e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.391047595068812e-05, + "sensitivity": 0.6352617466701862 + }, + { + "name": "model.layers.45.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 8.332041761605069e-05, + "sensitivity": 0.7134652049651453 + }, + { + "name": "model.layers.45.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1282195373496506e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.000814079015981406, + "sensitivity": 0.5531449510710328 + }, + { + "name": "model.layers.45.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008538783877156675, + "sensitivity": 0.5921694801484423 + }, + { + "name": "model.layers.45.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0664305136742769e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.612384459003806e-05, + "sensitivity": 0.6099073000491493 + }, + { + "name": "model.layers.45.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.967992132762447e-05, + "sensitivity": 0.8802183240568815 + }, + { + "name": "model.layers.45.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.016517671814654e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.663148426217958e-05, + "sensitivity": 0.6767365173728368 + }, + { + "name": "model.layers.45.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.57361961202696e-05, + "sensitivity": 0.9463141048833418 + }, + { + "name": "model.layers.45.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2430740525815054e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.115067662904039e-05, + "sensitivity": 0.7647484654674149 + }, + { + "name": "model.layers.45.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.263537554536015e-05, + "sensitivity": 0.8983198284253251 + }, + { + "name": "model.layers.45.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.948944352800027e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.204983558040112e-05, + "sensitivity": 0.8056458139962067 + }, + { + "name": "model.layers.45.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.217511301860213e-05, + "sensitivity": 0.7975619966445967 + }, + { + "name": "model.layers.45.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8407303059575497e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.942470645299181e-05, + "sensitivity": 0.7011462274397455 + }, + { + "name": "model.layers.45.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.486416143365204e-05, + "sensitivity": 0.6548094081062197 + }, + { + "name": "model.layers.45.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6775178437455907e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.085640052333474e-05, + "sensitivity": 0.7428441666307954 + }, + { + "name": "model.layers.45.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008079198887571692, + "sensitivity": 0.5745595502906116 + }, + { + "name": "model.layers.45.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.104953526009922e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.058688086341135e-05, + "sensitivity": 1.051264510919514 + }, + { + "name": "model.layers.45.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.257718243636191e-05, + "sensitivity": 0.9347630696326128 + }, + { + "name": "model.layers.45.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.063857212102448e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007589695742353797, + "sensitivity": 0.5928776712023085 + }, + { + "name": "model.layers.45.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.142200774978846e-05, + "sensitivity": 0.6337081658470192 + }, + { + "name": "model.layers.45.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.721343303681351e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.72074020258151e-05, + "sensitivity": 0.6764692018687412 + }, + { + "name": "model.layers.45.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0007837309967726469, + "sensitivity": 0.5977007336789903 + }, + { + "name": "model.layers.45.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 3.965688847529236e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007097739726305008, + "sensitivity": 0.5896044651783394 + }, + { + "name": "model.layers.45.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.667703903280199e-05, + "sensitivity": 0.6794212594258718 + }, + { + "name": "model.layers.45.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3990733123137034e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.335349800996482e-05, + "sensitivity": 0.691034160731711 + }, + { + "name": "model.layers.45.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 6.920025043655187e-05, + "sensitivity": 0.8619781022863682 + }, + { + "name": "model.layers.45.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4377413890542812e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.612152355955914e-05, + "sensitivity": 0.6367353813153447 + }, + { + "name": "model.layers.45.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.944137178128585e-05, + "sensitivity": 1.0409026711545604 + }, + { + "name": "model.layers.45.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 8.935154482969665e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008151166839525104, + "sensitivity": 0.5790338712880684 + }, + { + "name": "model.layers.45.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.569514855276793e-05, + "sensitivity": 0.9380654540488218 + }, + { + "name": "model.layers.45.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6169117316167103e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.306864426936954e-05, + "sensitivity": 0.9124794054286507 + }, + { + "name": "model.layers.45.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000898249913007021, + "sensitivity": 0.5997248210926773 + }, + { + "name": "model.layers.45.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.392456852045143e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.960241444176063e-05, + "sensitivity": 0.939249540965095 + }, + { + "name": "model.layers.45.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008494501817040145, + "sensitivity": 0.5814815137109908 + }, + { + "name": "model.layers.45.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.221024583894177e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.03753248672001e-05, + "sensitivity": 0.6350799936498673 + }, + { + "name": "model.layers.45.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.000905133318156004, + "sensitivity": 0.5948087874525744 + }, + { + "name": "model.layers.45.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.2555495888809673e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.207999442471191e-05, + "sensitivity": 0.6498325910795187 + }, + { + "name": "model.layers.45.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.3318956007424276e-05, + "sensitivity": 1.4048044276371554 + }, + { + "name": "model.layers.45.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1067650120821781e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.2705127119261306e-05, + "sensitivity": 1.2243219626895918 + }, + { + "name": "model.layers.45.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.650037878192961e-05, + "sensitivity": 0.607927158014021 + }, + { + "name": "model.layers.45.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0490066415513866e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0007089567370712757, + "sensitivity": 0.5794112279122521 + }, + { + "name": "model.layers.45.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 8.471207547700033e-05, + "sensitivity": 0.9166432664662603 + }, + { + "name": "model.layers.45.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2001246432191692e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.199881267501041e-05, + "sensitivity": 0.6246974648169094 + }, + { + "name": "model.layers.45.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.494653982575983e-05, + "sensitivity": 0.8525392025019264 + }, + { + "name": "model.layers.45.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 9.7172642199439e-07, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.909861258463934e-05, + "sensitivity": 0.6142372547637023 + }, + { + "name": "model.layers.45.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 7.95376327005215e-05, + "sensitivity": 0.6603417796074791 + }, + { + "name": "model.layers.45.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.518030669307336e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.560780457220972e-05, + "sensitivity": 0.6296475229566127 + }, + { + "name": "model.layers.45.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0008393779280595481, + "sensitivity": 0.5716619571933604 + }, + { + "name": "model.layers.45.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0123412721441127e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 6.464013131335378e-05, + "sensitivity": 0.6108437835235075 + }, + { + "name": "model.layers.45.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 1.8190205537393922e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 1.6067961041699164e-06, + "sensitivity": 2.1083288145833645 + }, + { + "name": "model.layers.45.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.926980636810185e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.45.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 2.0644049527618336e-06, + "sensitivity": 2.109535532406374 + }, + { + "name": "model.layers.45.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 1.013837299979059e-05, + "sensitivity": 2.2204466115840265 + }, + { + "name": "model.layers.45.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00017677027790341526, + "sensitivity": 0.8236962237716552 + }, + { + "name": "model.layers.45.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 2.1967405700706877e-05, + "sensitivity": 0.8446330295454528 + }, + { + "name": "model.layers.45.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 4.876946331933141e-05, + "sensitivity": 0.8716644334658985 + }, + { + "name": "model.layers.45.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 4, + "mse": 4.9542071792529896e-05, + "sensitivity": 1.5901123538979212 + }, + { + "name": "model.layers.46.mlp.experts.0.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00013053754810243845, + "sensitivity": 1.1540859258735257 + }, + { + "name": "model.layers.46.mlp.experts.0.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.122098521795124e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.0.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.381332736462355e-05, + "sensitivity": 0.6905156466636507 + }, + { + "name": "model.layers.46.mlp.experts.1.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010879666660912335, + "sensitivity": 0.8795830257682993 + }, + { + "name": "model.layers.46.mlp.experts.1.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.0300094547565095e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.1.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0009560708422213793, + "sensitivity": 0.5719404433138788 + }, + { + "name": "model.layers.46.mlp.experts.10.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 8.474296191707253e-05, + "sensitivity": 0.6319915408349575 + }, + { + "name": "model.layers.46.mlp.experts.10.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8695718608796597e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.10.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.249541133409366e-05, + "sensitivity": 0.655211592740122 + }, + { + "name": "model.layers.46.mlp.experts.11.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 9.738648077473044e-05, + "sensitivity": 1.0485965012833631 + }, + { + "name": "model.layers.46.mlp.experts.11.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4594719459637417e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.11.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.301745740231127e-05, + "sensitivity": 0.6655316393403599 + }, + { + "name": "model.layers.46.mlp.experts.12.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00011350627028150484, + "sensitivity": 0.7450068331748543 + }, + { + "name": "model.layers.46.mlp.experts.12.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.154917183361249e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.12.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.293020073324442e-05, + "sensitivity": 0.7598743987749716 + }, + { + "name": "model.layers.46.mlp.experts.13.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010155553900403902, + "sensitivity": 0.6072357724480051 + }, + { + "name": "model.layers.46.mlp.experts.13.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1052422905777348e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.13.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008489048923365772, + "sensitivity": 0.5843294537520678 + }, + { + "name": "model.layers.46.mlp.experts.14.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 4.3360714698792435e-06, + "sensitivity": 2.0987240938288028 + }, + { + "name": "model.layers.46.mlp.experts.14.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8251203073305078e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.14.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.868294389685616e-05, + "sensitivity": 0.656203764879123 + }, + { + "name": "model.layers.46.mlp.experts.15.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010342919267714024, + "sensitivity": 0.8328166200227044 + }, + { + "name": "model.layers.46.mlp.experts.15.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.7903067752486095e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.15.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.958554826676846e-05, + "sensitivity": 0.955444338274527 + }, + { + "name": "model.layers.46.mlp.experts.16.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 4.485902991291368e-06, + "sensitivity": 2.098514128802802 + }, + { + "name": "model.layers.46.mlp.experts.16.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.229585791406862e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.16.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0009584426297806203, + "sensitivity": 0.5679928447078884 + }, + { + "name": "model.layers.46.mlp.experts.17.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.8910803191829473e-05, + "sensitivity": 1.6894713475979257 + }, + { + "name": "model.layers.46.mlp.experts.17.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.991329781958484e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.17.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.333396883448586e-05, + "sensitivity": 0.6873266003535886 + }, + { + "name": "model.layers.46.mlp.experts.18.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.877342765510548e-05, + "sensitivity": 1.4557419679800532 + }, + { + "name": "model.layers.46.mlp.experts.18.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8117798390449025e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.18.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.988658373709768e-05, + "sensitivity": 0.6511999195623991 + }, + { + "name": "model.layers.46.mlp.experts.19.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.943886309163645e-05, + "sensitivity": 1.766829465468553 + }, + { + "name": "model.layers.46.mlp.experts.19.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.7923524637808441e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.19.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.251554001821205e-05, + "sensitivity": 0.8043060136197127 + }, + { + "name": "model.layers.46.mlp.experts.2.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 2.1326462956494652e-05, + "sensitivity": 1.9145930021211206 + }, + { + "name": "model.layers.46.mlp.experts.2.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.273237896588398e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.2.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 3.756400019483408e-06, + "sensitivity": 2.1006977676448204 + }, + { + "name": "model.layers.46.mlp.experts.20.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 4.208316113363253e-06, + "sensitivity": 2.0985394743905172 + }, + { + "name": "model.layers.46.mlp.experts.20.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8273898376719444e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.20.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.482372843194753e-05, + "sensitivity": 0.601701657246742 + }, + { + "name": "model.layers.46.mlp.experts.21.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 4.438781616045162e-06, + "sensitivity": 2.099681206521256 + }, + { + "name": "model.layers.46.mlp.experts.21.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.983027222100645e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.21.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.428702130913734e-05, + "sensitivity": 0.9091180432871573 + }, + { + "name": "model.layers.46.mlp.experts.22.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.0001066589611582458, + "sensitivity": 0.7411979167223126 + }, + { + "name": "model.layers.46.mlp.experts.22.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3109236078889808e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.22.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.679738337174058e-05, + "sensitivity": 0.609772366496049 + }, + { + "name": "model.layers.46.mlp.experts.23.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00012317218352109194, + "sensitivity": 0.6840122977627195 + }, + { + "name": "model.layers.46.mlp.experts.23.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1975281495324452e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.23.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.533964864909649e-05, + "sensitivity": 0.6582890164146779 + }, + { + "name": "model.layers.46.mlp.experts.24.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010157186625292525, + "sensitivity": 0.6479654854701529 + }, + { + "name": "model.layers.46.mlp.experts.24.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5207700698738336e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.24.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.100641571218148e-05, + "sensitivity": 0.6125182949513044 + }, + { + "name": "model.layers.46.mlp.experts.25.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010310176730854437, + "sensitivity": 1.1445992463107237 + }, + { + "name": "model.layers.46.mlp.experts.25.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.8988433794220327e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.25.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.00572379375808e-05, + "sensitivity": 0.8686785132743036 + }, + { + "name": "model.layers.46.mlp.experts.26.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00011125087621621788, + "sensitivity": 0.6579409378281863 + }, + { + "name": "model.layers.46.mlp.experts.26.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3023477549722884e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.26.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.517985017737374e-05, + "sensitivity": 0.6187835364232087 + }, + { + "name": "model.layers.46.mlp.experts.27.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 4.343546606833115e-06, + "sensitivity": 2.099172251731805 + }, + { + "name": "model.layers.46.mlp.experts.27.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.7955205748876324e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.27.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 2.0589632185874507e-05, + "sensitivity": 1.282000454345655 + }, + { + "name": "model.layers.46.mlp.experts.28.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010480178752914071, + "sensitivity": 0.9511266975472541 + }, + { + "name": "model.layers.46.mlp.experts.28.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2454079296730924e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.28.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.78891660249792e-05, + "sensitivity": 0.6212760424958272 + }, + { + "name": "model.layers.46.mlp.experts.29.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00011129312770208344, + "sensitivity": 1.045023796846907 + }, + { + "name": "model.layers.46.mlp.experts.29.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.927395715028979e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.29.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.514456905890256e-05, + "sensitivity": 0.6545094700259033 + }, + { + "name": "model.layers.46.mlp.experts.3.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010692574142012745, + "sensitivity": 0.6556030107722463 + }, + { + "name": "model.layers.46.mlp.experts.3.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.135741740654339e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.3.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008977591060101986, + "sensitivity": 0.5794994307769875 + }, + { + "name": "model.layers.46.mlp.experts.30.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 9.474702528677881e-05, + "sensitivity": 1.0185753255162837 + }, + { + "name": "model.layers.46.mlp.experts.30.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1864935913763475e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.30.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0009499727748334408, + "sensitivity": 0.5684232739227039 + }, + { + "name": "model.layers.46.mlp.experts.31.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 2.05737778742332e-05, + "sensitivity": 1.2525790323625374 + }, + { + "name": "model.layers.46.mlp.experts.31.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6598085039731814e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.31.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.280466474592686e-05, + "sensitivity": 0.6635620850512902 + }, + { + "name": "model.layers.46.mlp.experts.32.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 9.404008596902713e-05, + "sensitivity": 1.0511673175938694 + }, + { + "name": "model.layers.46.mlp.experts.32.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2180041721876478e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.32.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.113249689107761e-05, + "sensitivity": 0.74070964156838 + }, + { + "name": "model.layers.46.mlp.experts.33.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010200943506788462, + "sensitivity": 0.9590632783069597 + }, + { + "name": "model.layers.46.mlp.experts.33.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.199842927235295e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.33.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.727259410079569e-05, + "sensitivity": 1.0429055356891057 + }, + { + "name": "model.layers.46.mlp.experts.34.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 9.717916691442952e-05, + "sensitivity": 0.6967245799783546 + }, + { + "name": "model.layers.46.mlp.experts.34.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1343927326379344e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.34.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.960900984471664e-05, + "sensitivity": 0.6088278551174666 + }, + { + "name": "model.layers.46.mlp.experts.35.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010666543676052243, + "sensitivity": 0.604445307411541 + }, + { + "name": "model.layers.46.mlp.experts.35.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.996402716031298e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.35.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 3.6781354992854176e-06, + "sensitivity": 2.0995149739351646 + }, + { + "name": "model.layers.46.mlp.experts.36.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 5.305688318912871e-06, + "sensitivity": 2.0998511110087104 + }, + { + "name": "model.layers.46.mlp.experts.36.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.7987838418775937e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.36.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 0.00010054021549876779, + "sensitivity": 1.1664491375364472 + }, + { + "name": "model.layers.46.mlp.experts.37.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.001133376150391996, + "sensitivity": 0.5807802798203303 + }, + { + "name": "model.layers.46.mlp.experts.37.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.1788926005683606e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.37.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.867350697983056e-05, + "sensitivity": 0.7596439744312654 + }, + { + "name": "model.layers.46.mlp.experts.38.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010864916112041101, + "sensitivity": 0.710252310294041 + }, + { + "name": "model.layers.46.mlp.experts.38.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2010686987196095e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.38.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0008776218164712191, + "sensitivity": 0.5922126000716875 + }, + { + "name": "model.layers.46.mlp.experts.39.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.804723979148548e-05, + "sensitivity": 1.3070558627436712 + }, + { + "name": "model.layers.46.mlp.experts.39.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0657229267962975e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.39.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.90316189522855e-05, + "sensitivity": 0.6329484402872412 + }, + { + "name": "model.layers.46.mlp.experts.4.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.5606907254550606e-05, + "sensitivity": 1.5075152295087124 + }, + { + "name": "model.layers.46.mlp.experts.4.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 5.269886514724931e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.4.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.448414544342086e-05, + "sensitivity": 0.9407550949597456 + }, + { + "name": "model.layers.46.mlp.experts.40.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00011773363803513348, + "sensitivity": 0.8233412587228348 + }, + { + "name": "model.layers.46.mlp.experts.40.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6288553297272301e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.40.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0010520981159061193, + "sensitivity": 0.58472057541629 + }, + { + "name": "model.layers.46.mlp.experts.41.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.873902147053741e-05, + "sensitivity": 1.320980657590054 + }, + { + "name": "model.layers.46.mlp.experts.41.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2960615549673093e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.41.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.676039240323007e-05, + "sensitivity": 0.6065435258129059 + }, + { + "name": "model.layers.46.mlp.experts.42.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.751094350765925e-05, + "sensitivity": 1.4766472995816475 + }, + { + "name": "model.layers.46.mlp.experts.42.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.861512257368304e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.42.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 4.274795628589345e-06, + "sensitivity": 2.0990434326036955 + }, + { + "name": "model.layers.46.mlp.experts.43.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.0012073916150256991, + "sensitivity": 0.5614323236678874 + }, + { + "name": "model.layers.46.mlp.experts.43.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.421253500666353e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.43.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0009274596231989563, + "sensitivity": 0.5873822556360889 + }, + { + "name": "model.layers.46.mlp.experts.44.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010641371773090214, + "sensitivity": 0.8012652369644389 + }, + { + "name": "model.layers.46.mlp.experts.44.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.7673650063443347e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.44.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.86652123881504e-05, + "sensitivity": 0.704389329413023 + }, + { + "name": "model.layers.46.mlp.experts.45.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.7736878362484276e-05, + "sensitivity": 1.543063093501421 + }, + { + "name": "model.layers.46.mlp.experts.45.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.92630352305423e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.45.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.5093273759703152e-05, + "sensitivity": 1.2489380806178527 + }, + { + "name": "model.layers.46.mlp.experts.46.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 9.366613812744617e-05, + "sensitivity": 0.8768244266247034 + }, + { + "name": "model.layers.46.mlp.experts.46.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.0231756277789827e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.46.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0009026401676237583, + "sensitivity": 0.5817323587133575 + }, + { + "name": "model.layers.46.mlp.experts.47.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00011012342292815447, + "sensitivity": 0.8910287122249305 + }, + { + "name": "model.layers.46.mlp.experts.47.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.502993427493493e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.47.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.726939267944545e-05, + "sensitivity": 0.7940473502668739 + }, + { + "name": "model.layers.46.mlp.experts.48.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010842355550266802, + "sensitivity": 0.8101608150012826 + }, + { + "name": "model.layers.46.mlp.experts.48.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2980326573597267e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.48.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.429693454876542e-05, + "sensitivity": 0.6318005057176563 + }, + { + "name": "model.layers.46.mlp.experts.49.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 9.742174734128639e-05, + "sensitivity": 0.9750642516618144 + }, + { + "name": "model.layers.46.mlp.experts.49.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.5119048839551397e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.49.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.3263651453598868e-05, + "sensitivity": 1.644600777455261 + }, + { + "name": "model.layers.46.mlp.experts.5.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010652725177351385, + "sensitivity": 0.7083801756341188 + }, + { + "name": "model.layers.46.mlp.experts.5.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.071958533633733e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.5.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.945196168497205e-05, + "sensitivity": 0.7658374839889344 + }, + { + "name": "model.layers.46.mlp.experts.50.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 4.420996901899343e-06, + "sensitivity": 2.100853909159902 + }, + { + "name": "model.layers.46.mlp.experts.50.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.3869458800618304e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.50.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 0.0001221860875375569, + "sensitivity": 0.9823834021216635 + }, + { + "name": "model.layers.46.mlp.experts.51.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 4.28300063504139e-06, + "sensitivity": 2.1006699222196135 + }, + { + "name": "model.layers.46.mlp.experts.51.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 3.3507774332974805e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.51.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 6.529965958179673e-06, + "sensitivity": 2.1025294138970536 + }, + { + "name": "model.layers.46.mlp.experts.52.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010687959002098069, + "sensitivity": 0.7623752716758115 + }, + { + "name": "model.layers.46.mlp.experts.52.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.15448130297591e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.52.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.899572665337473e-05, + "sensitivity": 0.8429427699608418 + }, + { + "name": "model.layers.46.mlp.experts.53.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.001111392630264163, + "sensitivity": 0.5829775525710755 + }, + { + "name": "model.layers.46.mlp.experts.53.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.210277105201385e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.53.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.4761735656065866e-05, + "sensitivity": 1.2011206045893417 + }, + { + "name": "model.layers.46.mlp.experts.54.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 2, + "mse": 0.001143809175118804, + "sensitivity": 0.5909614605255281 + }, + { + "name": "model.layers.46.mlp.experts.54.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1435654414526653e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.54.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0009809763869270682, + "sensitivity": 0.549502466218953 + }, + { + "name": "model.layers.46.mlp.experts.55.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 3.4544598292995943e-06, + "sensitivity": 2.0986120611428976 + }, + { + "name": "model.layers.46.mlp.experts.55.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.38709958466643e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.55.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.689740545582026e-05, + "sensitivity": 0.8556894910267245 + }, + { + "name": "model.layers.46.mlp.experts.56.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.0001061617731465958, + "sensitivity": 0.633733003179401 + }, + { + "name": "model.layers.46.mlp.experts.56.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.2861146387876943e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.56.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.191523036453873e-05, + "sensitivity": 0.654646176216343 + }, + { + "name": "model.layers.46.mlp.experts.57.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.898840673675295e-05, + "sensitivity": 1.5125387803609518 + }, + { + "name": "model.layers.46.mlp.experts.57.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3516355465981178e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.57.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0010475933086127043, + "sensitivity": 0.5690659365014517 + }, + { + "name": "model.layers.46.mlp.experts.58.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 1.819782301026862e-05, + "sensitivity": 1.8490677158062097 + }, + { + "name": "model.layers.46.mlp.experts.58.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.6007686554075917e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.58.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 8.326483657583594e-05, + "sensitivity": 0.9632554009089189 + }, + { + "name": "model.layers.46.mlp.experts.59.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 4, + "mse": 2.346161454624962e-05, + "sensitivity": 1.252072382418025 + }, + { + "name": "model.layers.46.mlp.experts.59.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.531058615000802e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.59.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.694177626632154e-05, + "sensitivity": 1.6539339185632622 + }, + { + "name": "model.layers.46.mlp.experts.6.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 4.1555440475349315e-06, + "sensitivity": 2.1001783274159425 + }, + { + "name": "model.layers.46.mlp.experts.6.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 2.0449624571483582e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.6.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.90522894426249e-05, + "sensitivity": 0.7466088728314594 + }, + { + "name": "model.layers.46.mlp.experts.60.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 9.822245920076966e-05, + "sensitivity": 0.7367763340266343 + }, + { + "name": "model.layers.46.mlp.experts.60.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.916970177262556e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.60.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 7.404392817988992e-05, + "sensitivity": 0.7022742210057766 + }, + { + "name": "model.layers.46.mlp.experts.61.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010403658961877227, + "sensitivity": 0.602251724658996 + }, + { + "name": "model.layers.46.mlp.experts.61.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1604245173657546e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.61.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0009186958777718246, + "sensitivity": 0.5806266291238447 + }, + { + "name": "model.layers.46.mlp.experts.62.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.0001035523455357179, + "sensitivity": 1.0184639926687642 + }, + { + "name": "model.layers.46.mlp.experts.62.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.4906822798366193e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.62.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 9.227472764905542e-05, + "sensitivity": 0.6510924613941828 + }, + { + "name": "model.layers.46.mlp.experts.63.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00011185988842044026, + "sensitivity": 0.8154791655724977 + }, + { + "name": "model.layers.46.mlp.experts.63.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.828636754908075e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.63.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 3, + "mse": 0.00010190786269959062, + "sensitivity": 0.6719851156516655 + }, + { + "name": "model.layers.46.mlp.experts.7.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.0001069737336365506, + "sensitivity": 1.035304236231595 + }, + { + "name": "model.layers.46.mlp.experts.7.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3336547226572293e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.7.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0009811162017285824, + "sensitivity": 0.5917661447253096 + }, + { + "name": "model.layers.46.mlp.experts.8.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.000111205896246247, + "sensitivity": 0.645539685538388 + }, + { + "name": "model.layers.46.mlp.experts.8.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.1488540394566371e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.8.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 4, + "mse": 1.5673584130126983e-05, + "sensitivity": 1.4376614323485015 + }, + { + "name": "model.layers.46.mlp.experts.9.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 3, + "mse": 0.00010624093556543812, + "sensitivity": 1.1594959807731062 + }, + { + "name": "model.layers.46.mlp.experts.9.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 1.3168137229513377e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.experts.9.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 2, + "mse": 0.0009507543290965259, + "sensitivity": 0.5835253820331218 + }, + { + "name": "model.layers.46.mlp.gate.weight", + "shape": [ + 64, + 2048 + ], + "bits": 6, + "mse": 3.142298965030932e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.shared_experts.down_proj.weight", + "shape": [ + 2048, + 1536 + ], + "bits": 5, + "mse": 2.402887275820831e-06, + "sensitivity": 2.1124414328273495 + }, + { + "name": "model.layers.46.mlp.shared_experts.gate_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 6, + "mse": 4.825660653295927e-06, + "sensitivity": 10.0 + }, + { + "name": "model.layers.46.mlp.shared_experts.up_proj.weight", + "shape": [ + 1536, + 2048 + ], + "bits": 5, + "mse": 3.40148631039483e-06, + "sensitivity": 2.1102974568803563 + }, + { + "name": "model.layers.46.self_attn.kv_a_proj_with_mqa.weight", + "shape": [ + 576, + 2048 + ], + "bits": 5, + "mse": 8.597387932240963e-06, + "sensitivity": 2.225498087223552 + }, + { + "name": "model.layers.46.self_attn.kv_b_proj.weight", + "shape": [ + 8960, + 512 + ], + "bits": 3, + "mse": 0.00020850496366620064, + "sensitivity": 1.0691658795041334 + }, + { + "name": "model.layers.46.self_attn.o_proj.weight", + "shape": [ + 2048, + 5120 + ], + "bits": 4, + "mse": 1.890434396045748e-05, + "sensitivity": 1.5446165103703402 + }, + { + "name": "model.layers.46.self_attn.q_a_proj.weight", + "shape": [ + 768, + 2048 + ], + "bits": 3, + "mse": 3.232548988307826e-05, + "sensitivity": 0.7564150290413465 + }, + { + "name": "model.layers.46.self_attn.q_b_proj.weight", + "shape": [ + 5120, + 768 + ], + "bits": 4, + "mse": 7.500631909351796e-05, + "sensitivity": 1.3365260246052333 + } + ] +} \ No newline at end of file