{ "model_id": "zai-org/GLM-4.7-Flash", "quantization": { "method": "trellis_cuda", "min_bits": 2, "max_bits": 8, "group_size": 128, "effective_bits": 3.7848377517799006 }, "statistics": { "total_tensors": 9254, "successful": 9254, "failed": 0, "total_params": 29308747776, "avg_mse": 0.0002232240694604069, "total_time_sec": 110.36988474000009, "bit_distribution": { "2b": 2736, "3b": 2710, "4b": 575, "5b": 196, "6b": 3037 } }, "layers": [ { "name": "model.layers.0.mlp.down_proj.weight", "shape": [ 2048, 10240 ], "bits": 5, "mse": 3.0065662031120155e-06, "sensitivity": 2.0979309245857647 }, { "name": "model.layers.0.mlp.gate_proj.weight", "shape": [ 10240, 2048 ], "bits": 6, "mse": 8.390748007514048e-07, "sensitivity": 10.0 }, { "name": "model.layers.0.mlp.up_proj.weight", "shape": [ 10240, 2048 ], "bits": 3, "mse": 7.702448056079447e-05, "sensitivity": 1.153642657995318 }, { "name": "model.layers.0.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 5.357392637961311e-06, "sensitivity": 2.1543192625786647 }, { "name": "model.layers.0.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 5, "mse": 7.915920832601842e-06, "sensitivity": 2.2066540899914355 }, { "name": "model.layers.0.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 4.408653239806881e-06, "sensitivity": 1.9473644949828508 }, { "name": "model.layers.0.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 2.355716424062848e-05, "sensitivity": 0.9940753678023229 }, { "name": "model.layers.0.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 5, "mse": 9.121675248024985e-06, "sensitivity": 2.180818978882941 }, { "name": "model.layers.1.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.945580414845608e-05, "sensitivity": 1.05633246261043 }, { "name": "model.layers.1.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.088716304475383e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000706042570527643, "sensitivity": 0.5329304776870476 }, { "name": "model.layers.1.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8707199059426785e-05, "sensitivity": 1.1509562616551563 }, { "name": "model.layers.1.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.304556106646487e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.94214686518535e-05, "sensitivity": 0.7511464235585992 }, { "name": "model.layers.1.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.208647391758859e-05, "sensitivity": 0.9750583685936092 }, { "name": "model.layers.1.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.202154168022389e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007012628484517336, "sensitivity": 0.5736765453445599 }, { "name": "model.layers.1.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.852015965501778e-05, "sensitivity": 0.6750553503787329 }, { "name": "model.layers.1.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.074311045267677e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007069016573950648, "sensitivity": 0.5116522315040535 }, { "name": "model.layers.1.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.1475853979354724e-05, "sensitivity": 1.0840733054978677 }, { "name": "model.layers.1.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.388847057474777e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5915821576491e-05, "sensitivity": 0.9136558228696315 }, { "name": "model.layers.1.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.772859731223434e-05, "sensitivity": 0.7332689229887623 }, { "name": "model.layers.1.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.858658482793544e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006789648323319852, "sensitivity": 0.5273672147108106 }, { "name": "model.layers.1.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.021194712957367e-05, "sensitivity": 0.9322568931511268 }, { "name": "model.layers.1.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.647094323852798e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007528256392106414, "sensitivity": 0.5464896467410008 }, { "name": "model.layers.1.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9081932704430073e-05, "sensitivity": 0.6288406834657645 }, { "name": "model.layers.1.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.231706493053935e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007251184433698654, "sensitivity": 0.5298342810057413 }, { "name": "model.layers.1.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006876597180962563, "sensitivity": 0.5478110312226175 }, { "name": "model.layers.1.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.369790526150609e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007398161105811596, "sensitivity": 0.542743823874873 }, { "name": "model.layers.1.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006861464935354888, "sensitivity": 0.556595269158572 }, { "name": "model.layers.1.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.273803023759683e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007265096064656973, "sensitivity": 0.5431470246513287 }, { "name": "model.layers.1.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.926963684847578e-06, "sensitivity": 1.5297450242053912 }, { "name": "model.layers.1.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.700816245735041e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.883780977455899e-05, "sensitivity": 0.6514522296068361 }, { "name": "model.layers.1.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.366184970829636e-05, "sensitivity": 0.7059876012078068 }, { "name": "model.layers.1.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.651163175774855e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007717191474512219, "sensitivity": 0.5432075135849723 }, { "name": "model.layers.1.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6457949540345e-05, "sensitivity": 0.6700653032618367 }, { "name": "model.layers.1.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.894651167182019e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006909866351634264, "sensitivity": 0.5315274682237326 }, { "name": "model.layers.1.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.778695049230009e-05, "sensitivity": 0.6743638645954556 }, { "name": "model.layers.1.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.989932105876505e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.222042429726571e-05, "sensitivity": 0.6076999462716999 }, { "name": "model.layers.1.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.088727241149172e-05, "sensitivity": 0.9293144556174866 }, { "name": "model.layers.1.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.083968054961588e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.57602577120997e-05, "sensitivity": 0.6125585061286023 }, { "name": "model.layers.1.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8775298384716734e-05, "sensitivity": 0.6269297842135456 }, { "name": "model.layers.1.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.936102181498427e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007491018623113632, "sensitivity": 0.5717816080186022 }, { "name": "model.layers.1.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.712389247491956e-05, "sensitivity": 0.6017964557839103 }, { "name": "model.layers.1.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.992279739075457e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006939051672816277, "sensitivity": 0.5351029455097621 }, { "name": "model.layers.1.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0345183909521438e-05, "sensitivity": 1.2175160671256555 }, { "name": "model.layers.1.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.800407052447554e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006646983092650771, "sensitivity": 0.5437498645340249 }, { "name": "model.layers.1.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0325789844500832e-05, "sensitivity": 1.602549990546906 }, { "name": "model.layers.1.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.76636580262857e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006699999212287366, "sensitivity": 0.5617565518374802 }, { "name": "model.layers.1.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.663551200996153e-05, "sensitivity": 0.8011861740161235 }, { "name": "model.layers.1.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.255478410821524e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.39556092210114e-05, "sensitivity": 0.8260173891625407 }, { "name": "model.layers.1.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.867027721251361e-05, "sensitivity": 0.839696167916931 }, { "name": "model.layers.1.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.474218707808177e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007384248310700059, "sensitivity": 0.5318172552201543 }, { "name": "model.layers.1.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 7.762881068629213e-06, "sensitivity": 1.3919723737977423 }, { "name": "model.layers.1.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.743935045960825e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.287332507781684e-05, "sensitivity": 0.6382699162946295 }, { "name": "model.layers.1.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0072743508499116e-05, "sensitivity": 0.6848972557441011 }, { "name": "model.layers.1.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.227509175005252e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007216193480417132, "sensitivity": 0.5585915304281914 }, { "name": "model.layers.1.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.212219886947423e-05, "sensitivity": 0.6404290906497698 }, { "name": "model.layers.1.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.451672334151226e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007516718469560146, "sensitivity": 0.5154440675940664 }, { "name": "model.layers.1.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006734145572409034, "sensitivity": 0.5789922620595601 }, { "name": "model.layers.1.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.244005135158659e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007194909267127514, "sensitivity": 0.506542767829843 }, { "name": "model.layers.1.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.710440382244997e-05, "sensitivity": 0.7785803883817267 }, { "name": "model.layers.1.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.073648819437949e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006898684659972787, "sensitivity": 0.5033169345189182 }, { "name": "model.layers.1.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.526108361664228e-05, "sensitivity": 0.8204644621674357 }, { "name": "model.layers.1.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.831716407556087e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006732492474839091, "sensitivity": 0.5535000565800609 }, { "name": "model.layers.1.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.136714364401996e-05, "sensitivity": 1.062624637754448 }, { "name": "model.layers.1.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.516017947433284e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007479293271899223, "sensitivity": 0.5805955468164434 }, { "name": "model.layers.1.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6859156757127494e-05, "sensitivity": 0.6684237266059603 }, { "name": "model.layers.1.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.885818836759427e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006734858034178615, "sensitivity": 0.5321618340896571 }, { "name": "model.layers.1.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.288357351673767e-05, "sensitivity": 0.9988061100013048 }, { "name": "model.layers.1.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.394538220571121e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006305475253611803, "sensitivity": 0.5114646678925123 }, { "name": "model.layers.1.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.948065881966613e-05, "sensitivity": 0.871043374315495 }, { "name": "model.layers.1.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.139675861049909e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007124726544134319, "sensitivity": 0.5409620875025165 }, { "name": "model.layers.1.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.167671381263062e-05, "sensitivity": 0.9436389842736912 }, { "name": "model.layers.1.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.399570793291787e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007443134090863168, "sensitivity": 0.5187434612131631 }, { "name": "model.layers.1.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.017141276970506e-05, "sensitivity": 0.7414642847630519 }, { "name": "model.layers.1.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.187839289850672e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007151130121201277, "sensitivity": 0.5954510689508186 }, { "name": "model.layers.1.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007028746185824275, "sensitivity": 0.5657199560715326 }, { "name": "model.layers.1.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.586002427866333e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007675624219700694, "sensitivity": 0.5063895863360861 }, { "name": "model.layers.1.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.203779048519209e-05, "sensitivity": 0.7285713972900425 }, { "name": "model.layers.1.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.577242857019883e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007657792302779853, "sensitivity": 0.5350005813599398 }, { "name": "model.layers.1.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.045118789188564e-05, "sensitivity": 0.6051168168531535 }, { "name": "model.layers.1.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.327325081656454e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007333098910748959, "sensitivity": 0.5718397820387567 }, { "name": "model.layers.1.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006814757362008095, "sensitivity": 0.5902750491594287 }, { "name": "model.layers.1.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.376571946020704e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007336141425184906, "sensitivity": 0.5272879368864146 }, { "name": "model.layers.1.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0309031495125964e-05, "sensitivity": 1.2275653482163982 }, { "name": "model.layers.1.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.168316074057657e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.058573490008712e-05, "sensitivity": 0.8601511940648492 }, { "name": "model.layers.1.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8852114307228476e-05, "sensitivity": 0.7027394093461021 }, { "name": "model.layers.1.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.216733936525998e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007218911778181791, "sensitivity": 0.5486119794567152 }, { "name": "model.layers.1.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.813718235003762e-05, "sensitivity": 0.604454106817387 }, { "name": "model.layers.1.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.174225291033508e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007113752653822303, "sensitivity": 0.5178570242603164 }, { "name": "model.layers.1.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.241572555154562e-05, "sensitivity": 0.6704578479346931 }, { "name": "model.layers.1.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.485859103122493e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007571444730274379, "sensitivity": 0.5161457909887365 }, { "name": "model.layers.1.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9612852055579424e-05, "sensitivity": 0.6918091462587476 }, { "name": "model.layers.1.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.636150260419527e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007355489651672542, "sensitivity": 0.5288312287818265 }, { "name": "model.layers.1.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.993898957967758e-05, "sensitivity": 0.6608220765217772 }, { "name": "model.layers.1.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.3513436998619e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007413762505166233, "sensitivity": 0.5230738295211257 }, { "name": "model.layers.1.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.126197695266455e-05, "sensitivity": 0.697775647531875 }, { "name": "model.layers.1.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.526100833070814e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007590969908051193, "sensitivity": 0.5675856909411058 }, { "name": "model.layers.1.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0119404224678874e-05, "sensitivity": 0.7838928925372811 }, { "name": "model.layers.1.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.316608391898626e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007315666298381984, "sensitivity": 0.573187165551579 }, { "name": "model.layers.1.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5940356105566025e-05, "sensitivity": 1.1232700925487693 }, { "name": "model.layers.1.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.744641384808347e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006764165009371936, "sensitivity": 0.515544866960908 }, { "name": "model.layers.1.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.92915021115914e-05, "sensitivity": 0.7217744705244168 }, { "name": "model.layers.1.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.196989374984696e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007202638080343604, "sensitivity": 0.5630791192958148 }, { "name": "model.layers.1.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.810360744362697e-05, "sensitivity": 0.952676883384989 }, { "name": "model.layers.1.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.229907967281179e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007110365550033748, "sensitivity": 0.5695350375952825 }, { "name": "model.layers.1.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.003324961056933e-05, "sensitivity": 0.8604997117090291 }, { "name": "model.layers.1.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.221384865057189e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007243648869916797, "sensitivity": 0.5045773072470656 }, { "name": "model.layers.1.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.751938705448993e-06, "sensitivity": 1.3835859698943191 }, { "name": "model.layers.1.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.506403795152437e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006411081412807107, "sensitivity": 0.5951880384716677 }, { "name": "model.layers.1.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006655186880379915, "sensitivity": 0.5347733054740964 }, { "name": "model.layers.1.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.547451221194933e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007549802539870143, "sensitivity": 0.5582450191679067 }, { "name": "model.layers.1.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006968966918066144, "sensitivity": 0.5596353657531932 }, { "name": "model.layers.1.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.712450044688012e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007804572815075517, "sensitivity": 0.5130251498411098 }, { "name": "model.layers.1.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9856451116502285e-05, "sensitivity": 0.726034216473246 }, { "name": "model.layers.1.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.285960694185633e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007261476712301373, "sensitivity": 0.5328406724804157 }, { "name": "model.layers.1.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.902646080357954e-05, "sensitivity": 0.6541645299090524 }, { "name": "model.layers.1.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.98717349475919e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006953920237720013, "sensitivity": 0.545202173251164 }, { "name": "model.layers.1.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5473643442383036e-05, "sensitivity": 0.8567062361254867 }, { "name": "model.layers.1.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.672268343914766e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006545383366756141, "sensitivity": 0.5524932342585303 }, { "name": "model.layers.1.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.105279317125678e-05, "sensitivity": 0.7402823940228639 }, { "name": "model.layers.1.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.898332571836363e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007377161527983844, "sensitivity": 0.5198659536876988 }, { "name": "model.layers.1.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8163044741377234e-05, "sensitivity": 0.7491417479602756 }, { "name": "model.layers.1.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.228904112504097e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007213937933556736, "sensitivity": 0.5734752383745237 }, { "name": "model.layers.1.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9510344726732e-05, "sensitivity": 0.7350354381221457 }, { "name": "model.layers.1.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.305651822913205e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007306559709832072, "sensitivity": 0.5082377979504902 }, { "name": "model.layers.1.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006715766503475606, "sensitivity": 0.5398906733224176 }, { "name": "model.layers.1.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.236691660888027e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007296734838746488, "sensitivity": 0.49871185329574025 }, { "name": "model.layers.1.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.046460475772619e-05, "sensitivity": 0.6475521480563887 }, { "name": "model.layers.1.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.318912255665055e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007349549559876323, "sensitivity": 0.5512153371439551 }, { "name": "model.layers.1.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7738448958843946e-05, "sensitivity": 0.8059062142705675 }, { "name": "model.layers.1.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.254175559661235e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.327655137283728e-05, "sensitivity": 0.6188513324400853 }, { "name": "model.layers.1.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0171381291002035e-05, "sensitivity": 1.4806646686297573 }, { "name": "model.layers.1.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.4057363740867e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5805685406085104e-05, "sensitivity": 0.8186139180290579 }, { "name": "model.layers.1.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.053488323232159e-05, "sensitivity": 0.6792806663932732 }, { "name": "model.layers.1.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.314900247161859e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007333712419494987, "sensitivity": 0.4972852873368069 }, { "name": "model.layers.1.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006558268214575946, "sensitivity": 0.5736437222639301 }, { "name": "model.layers.1.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.132133307801269e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.312305049505085e-05, "sensitivity": 0.6402156256978115 }, { "name": "model.layers.1.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.2993936252314597e-05, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.5860648545640288e-06, "sensitivity": 2.097979164114025 }, { "name": "model.layers.1.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.960584748114343e-07, "sensitivity": 10.0 }, { "name": "model.layers.1.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 6.908195700816577e-06, "sensitivity": 1.7474623316197488 }, { "name": "model.layers.1.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 5.859585144207813e-06, "sensitivity": 2.1343460618200747 }, { "name": "model.layers.1.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 4, "mse": 4.448661638889462e-05, "sensitivity": 1.2595580437578628 }, { "name": "model.layers.1.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 9.338111340184696e-06, "sensitivity": 1.5287555831986808 }, { "name": "model.layers.1.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 3.1847102945903316e-05, "sensitivity": 0.8137678952447148 }, { "name": "model.layers.1.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 4, "mse": 6.655816832790151e-05, "sensitivity": 1.4344571446740946 }, { "name": "model.layers.2.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.788936323369853e-05, "sensitivity": 0.637117571081665 }, { "name": "model.layers.2.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.92528749621124e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006853381637483835, "sensitivity": 0.5292625168620071 }, { "name": "model.layers.2.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006603162037208676, "sensitivity": 0.5099343843315627 }, { "name": "model.layers.2.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.916039071962587e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006885470356792212, "sensitivity": 0.5383619701065838 }, { "name": "model.layers.2.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8043071476276964e-05, "sensitivity": 0.7901511208644407 }, { "name": "model.layers.2.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.425913170460262e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.483458128059283e-05, "sensitivity": 0.6151559787240425 }, { "name": "model.layers.2.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006500632152892649, "sensitivity": 0.5224479702307299 }, { "name": "model.layers.2.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.864437753189122e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006800758419558406, "sensitivity": 0.516434915779298 }, { "name": "model.layers.2.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006621964275836945, "sensitivity": 0.5357516082936662 }, { "name": "model.layers.2.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.296368155744858e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007026169914752245, "sensitivity": 0.5020391801268185 }, { "name": "model.layers.2.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006564076757058501, "sensitivity": 0.5291995930497548 }, { "name": "model.layers.2.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.847191459906753e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006729754386469722, "sensitivity": 0.5494191738948431 }, { "name": "model.layers.2.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006531747058033943, "sensitivity": 0.5424451453172494 }, { "name": "model.layers.2.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.043167104508029e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006917932769283652, "sensitivity": 0.5175586013374985 }, { "name": "model.layers.2.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.855287236045115e-05, "sensitivity": 0.6272529683970446 }, { "name": "model.layers.2.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.18402964391862e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007024051155894995, "sensitivity": 0.5300315797519255 }, { "name": "model.layers.2.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006588708492927253, "sensitivity": 0.5876723057827589 }, { "name": "model.layers.2.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.969351377643761e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006939381128177047, "sensitivity": 0.5733248891278955 }, { "name": "model.layers.2.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006776638329029083, "sensitivity": 0.5271574989151324 }, { "name": "model.layers.2.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.140612072158547e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007107902783900499, "sensitivity": 0.5559366843677089 }, { "name": "model.layers.2.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006497822469100356, "sensitivity": 0.5294735033525237 }, { "name": "model.layers.2.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.832420129081584e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006744188140146434, "sensitivity": 0.5231441727437001 }, { "name": "model.layers.2.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000665354251395911, "sensitivity": 0.5321946901335889 }, { "name": "model.layers.2.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.975477961328579e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006952101830393076, "sensitivity": 0.5259397434370704 }, { "name": "model.layers.2.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006540108006447554, "sensitivity": 0.5048513525104465 }, { "name": "model.layers.2.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.81134486310475e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006742709083482623, "sensitivity": 0.5262978148800059 }, { "name": "model.layers.2.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.863839032826945e-05, "sensitivity": 0.6703715924798028 }, { "name": "model.layers.2.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.938485969636531e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000688089698087424, "sensitivity": 0.5200938695271349 }, { "name": "model.layers.2.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8586061641108245e-05, "sensitivity": 0.9237234380209465 }, { "name": "model.layers.2.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.031565931152727e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006988599780015647, "sensitivity": 0.5532940274008371 }, { "name": "model.layers.2.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006515826098620892, "sensitivity": 0.5492346116743078 }, { "name": "model.layers.2.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.846945327903086e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006772064371034503, "sensitivity": 0.5522856518020094 }, { "name": "model.layers.2.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006531979888677597, "sensitivity": 0.5250952719843 }, { "name": "model.layers.2.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.833566092405817e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006774617359042168, "sensitivity": 0.5260844666104033 }, { "name": "model.layers.2.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006502066971734166, "sensitivity": 0.5359265831620937 }, { "name": "model.layers.2.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.845467399012705e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006737875519320369, "sensitivity": 0.5227271346167179 }, { "name": "model.layers.2.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006600776687264442, "sensitivity": 0.5137320249233672 }, { "name": "model.layers.2.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.987889721836837e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006912198732607067, "sensitivity": 0.5659112750063078 }, { "name": "model.layers.2.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.844603219884448e-05, "sensitivity": 0.6100404991673078 }, { "name": "model.layers.2.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.019632792231278e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006926943315193057, "sensitivity": 0.5473455438023518 }, { "name": "model.layers.2.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000651102396659553, "sensitivity": 0.5695221530731435 }, { "name": "model.layers.2.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.804732836622861e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006717864307574928, "sensitivity": 0.5350351552582775 }, { "name": "model.layers.2.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006406318861991167, "sensitivity": 0.5390368199438017 }, { "name": "model.layers.2.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.79091363306361e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006692288443446159, "sensitivity": 0.5303933995388403 }, { "name": "model.layers.2.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006477210554294288, "sensitivity": 0.5504735892614155 }, { "name": "model.layers.2.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.817384476358711e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006730208988301456, "sensitivity": 0.5196833422682965 }, { "name": "model.layers.2.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006742124678567052, "sensitivity": 0.5890436954584746 }, { "name": "model.layers.2.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.398703931154159e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00072105647996068, "sensitivity": 0.5350870112633378 }, { "name": "model.layers.2.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006554084829986095, "sensitivity": 0.53524745271771 }, { "name": "model.layers.2.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.917395355936605e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006829767371527851, "sensitivity": 0.5303733738212072 }, { "name": "model.layers.2.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006702264654450119, "sensitivity": 0.5242864592397053 }, { "name": "model.layers.2.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.053537617844995e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007012556307017803, "sensitivity": 0.5208583382292724 }, { "name": "model.layers.2.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006572377751581371, "sensitivity": 0.5776043202321025 }, { "name": "model.layers.2.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.938422873441596e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006880320142954588, "sensitivity": 0.5631608039445111 }, { "name": "model.layers.2.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006652208976447582, "sensitivity": 0.5643857546298421 }, { "name": "model.layers.2.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.969920380266558e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006962899933569133, "sensitivity": 0.5277075076174838 }, { "name": "model.layers.2.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.919697287026793e-05, "sensitivity": 0.8645927415528301 }, { "name": "model.layers.2.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.332454063340265e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007268571644090116, "sensitivity": 0.5893619816314745 }, { "name": "model.layers.2.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000657309778034687, "sensitivity": 0.5276774531742341 }, { "name": "model.layers.2.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.948190846538637e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006853543454781175, "sensitivity": 0.5117859684057103 }, { "name": "model.layers.2.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.995994069962762e-05, "sensitivity": 0.6999846551822053 }, { "name": "model.layers.2.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.337795070976426e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007308036438189447, "sensitivity": 0.5384432380359576 }, { "name": "model.layers.2.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006623267545364797, "sensitivity": 0.5345988614047849 }, { "name": "model.layers.2.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.923203616475803e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006884669419378042, "sensitivity": 0.5344720642256285 }, { "name": "model.layers.2.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006558216991834342, "sensitivity": 0.5552878261669154 }, { "name": "model.layers.2.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.95667984271131e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006911600357852876, "sensitivity": 0.558485497951545 }, { "name": "model.layers.2.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006603606743738055, "sensitivity": 0.5191522454533072 }, { "name": "model.layers.2.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.887392262593494e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006860473076812923, "sensitivity": 0.5182085053663555 }, { "name": "model.layers.2.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006595769664272666, "sensitivity": 0.5387287782824223 }, { "name": "model.layers.2.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.975117574053002e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006852728547528386, "sensitivity": 0.5401791905081401 }, { "name": "model.layers.2.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006616559694521129, "sensitivity": 0.5502344849506853 }, { "name": "model.layers.2.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.168349955260055e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007121736416593194, "sensitivity": 0.5257197859244577 }, { "name": "model.layers.2.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006602990324608982, "sensitivity": 0.5352175636436438 }, { "name": "model.layers.2.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.072373253118712e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006975110154598951, "sensitivity": 0.5253953036227406 }, { "name": "model.layers.2.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.847254578839056e-05, "sensitivity": 0.6744290943302863 }, { "name": "model.layers.2.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.976164629828418e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006898273131810129, "sensitivity": 0.5131317138379279 }, { "name": "model.layers.2.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006443810416385531, "sensitivity": 0.5364398600027781 }, { "name": "model.layers.2.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.75344472508732e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00066965795122087, "sensitivity": 0.5287747142843991 }, { "name": "model.layers.2.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006555371219292283, "sensitivity": 0.5298937326809323 }, { "name": "model.layers.2.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.863262231287081e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006783413700759411, "sensitivity": 0.5360677603850484 }, { "name": "model.layers.2.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006589422700926661, "sensitivity": 0.52567734290152 }, { "name": "model.layers.2.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.903590931666258e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006865175673738122, "sensitivity": 0.5113374437129758 }, { "name": "model.layers.2.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.056283018551767e-05, "sensitivity": 0.8130634937372851 }, { "name": "model.layers.2.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.551108526764438e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007502136286348104, "sensitivity": 0.5679884884984271 }, { "name": "model.layers.2.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006572939455509186, "sensitivity": 0.5285530080241079 }, { "name": "model.layers.2.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.910529807806597e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.103175110183656e-05, "sensitivity": 0.6974900573935633 }, { "name": "model.layers.2.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006402467261068523, "sensitivity": 0.5193772642978772 }, { "name": "model.layers.2.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.721404932046426e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006634256569668651, "sensitivity": 0.509148896437688 }, { "name": "model.layers.2.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006636054022237659, "sensitivity": 0.5575365228207116 }, { "name": "model.layers.2.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.099635356804356e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006969396490603685, "sensitivity": 0.5495433515091557 }, { "name": "model.layers.2.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006525152130052447, "sensitivity": 0.5353655557365348 }, { "name": "model.layers.2.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.896843049413292e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006843453738838434, "sensitivity": 0.5083458433448123 }, { "name": "model.layers.2.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006681729573756456, "sensitivity": 0.510966516522825 }, { "name": "model.layers.2.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.199109066074016e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007100507500581443, "sensitivity": 0.5243675741497633 }, { "name": "model.layers.2.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8295827329857275e-05, "sensitivity": 0.9484956892288682 }, { "name": "model.layers.2.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.046155931471731e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000698285351973027, "sensitivity": 0.5452995355393195 }, { "name": "model.layers.2.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006641469663009048, "sensitivity": 0.5122728100893725 }, { "name": "model.layers.2.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.08182403993851e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007040153141133487, "sensitivity": 0.52989166248 }, { "name": "model.layers.2.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006552995182573795, "sensitivity": 0.5353256304098736 }, { "name": "model.layers.2.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.916703003094881e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006831820937804878, "sensitivity": 0.5216248657576118 }, { "name": "model.layers.2.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.982746370136738e-05, "sensitivity": 0.636830613385323 }, { "name": "model.layers.2.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.224976800695003e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007242219289764762, "sensitivity": 0.524152812399479 }, { "name": "model.layers.2.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006630783900618553, "sensitivity": 0.560645864431946 }, { "name": "model.layers.2.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.085374479880556e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007047917461022735, "sensitivity": 0.5189983170325728 }, { "name": "model.layers.2.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000661292695440352, "sensitivity": 0.538721496916462 }, { "name": "model.layers.2.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.903252713324036e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006858484703116119, "sensitivity": 0.5175842759376842 }, { "name": "model.layers.2.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006530710961669683, "sensitivity": 0.5174343079627206 }, { "name": "model.layers.2.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.885612495148962e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006827026372775435, "sensitivity": 0.5384035207869178 }, { "name": "model.layers.2.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006474404945038259, "sensitivity": 0.5591837012619704 }, { "name": "model.layers.2.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.764767365690204e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000665488769300282, "sensitivity": 0.5344813831108406 }, { "name": "model.layers.2.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0248272347962484e-05, "sensitivity": 0.8088675037872083 }, { "name": "model.layers.2.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.614799303861219e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007504869136027992, "sensitivity": 0.5237759632866068 }, { "name": "model.layers.2.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006573947030119598, "sensitivity": 0.5319763064105894 }, { "name": "model.layers.2.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.943034011579584e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006883634487167001, "sensitivity": 0.5066853077842175 }, { "name": "model.layers.2.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006520501337945461, "sensitivity": 0.5203838029279557 }, { "name": "model.layers.2.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.995697733851557e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006901883753016591, "sensitivity": 0.5290526117255341 }, { "name": "model.layers.2.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006562476046383381, "sensitivity": 0.5281240206977428 }, { "name": "model.layers.2.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.860451324224414e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006805011071264744, "sensitivity": 0.5461121242462301 }, { "name": "model.layers.2.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000656422576867044, "sensitivity": 0.5200439116695399 }, { "name": "model.layers.2.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.915557608204836e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006836946122348309, "sensitivity": 0.5328029935690293 }, { "name": "model.layers.2.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006833894876763225, "sensitivity": 0.5645945286382655 }, { "name": "model.layers.2.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.547567181769409e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007568466826342046, "sensitivity": 0.5228128781431518 }, { "name": "model.layers.2.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.886183862457983e-05, "sensitivity": 0.6841249970844974 }, { "name": "model.layers.2.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.953453978690959e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006884029135107994, "sensitivity": 0.5690201736260146 }, { "name": "model.layers.2.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006462761084549129, "sensitivity": 0.5673701104285848 }, { "name": "model.layers.2.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.850297384313308e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0109508922323585e-05, "sensitivity": 1.0060064428874793 }, { "name": "model.layers.2.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006560714682564139, "sensitivity": 0.5284611704128155 }, { "name": "model.layers.2.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.948444936620945e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006893288227729499, "sensitivity": 0.5702227039931743 }, { "name": "model.layers.2.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.577230796101503e-05, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.7074335119104944e-06, "sensitivity": 2.098499783883584 }, { "name": "model.layers.2.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.901593229078571e-07, "sensitivity": 10.0 }, { "name": "model.layers.2.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.508206878497731e-06, "sensitivity": 2.10002572709809 }, { "name": "model.layers.2.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 7.818973244866356e-06, "sensitivity": 2.147258117697571 }, { "name": "model.layers.2.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 4, "mse": 4.0905903006205335e-05, "sensitivity": 1.6965800120929972 }, { "name": "model.layers.2.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.0648647730704397e-05, "sensitivity": 1.3951812998881747 }, { "name": "model.layers.2.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 3.31717892549932e-05, "sensitivity": 0.6802548373058802 }, { "name": "model.layers.2.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 4, "mse": 6.339624087559059e-05, "sensitivity": 1.3975228176289385 }, { "name": "model.layers.3.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.00063593580853194, "sensitivity": 0.5430232024275826 }, { "name": "model.layers.3.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.87619183534116e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006775655783712864, "sensitivity": 0.5364652703539503 }, { "name": "model.layers.3.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.091729301260784e-05, "sensitivity": 0.8758214002175702 }, { "name": "model.layers.3.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.550861826326582e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007419133326038718, "sensitivity": 0.5031770573616399 }, { "name": "model.layers.3.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006539140595123172, "sensitivity": 0.5156224245959506 }, { "name": "model.layers.3.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.041358346919878e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006979070021770895, "sensitivity": 0.5337455090844447 }, { "name": "model.layers.3.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.910659092478454e-05, "sensitivity": 0.7615865120359873 }, { "name": "model.layers.3.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.199755375746463e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007079739589244127, "sensitivity": 0.5186877673014849 }, { "name": "model.layers.3.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.741295899497345e-05, "sensitivity": 0.6104928520252837 }, { "name": "model.layers.3.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.986527185086743e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006870722281746566, "sensitivity": 0.5212532050489352 }, { "name": "model.layers.3.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9157471696380526e-05, "sensitivity": 0.7005442004099369 }, { "name": "model.layers.3.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.21246954324306e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007166705909185112, "sensitivity": 0.5068299902955895 }, { "name": "model.layers.3.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006489607039839029, "sensitivity": 0.5702282640285534 }, { "name": "model.layers.3.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.028569714544574e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000688763742800802, "sensitivity": 0.5151941100294097 }, { "name": "model.layers.3.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006581756169907749, "sensitivity": 0.562388515824322 }, { "name": "model.layers.3.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.113843369348615e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007013880531303585, "sensitivity": 0.5320735089131359 }, { "name": "model.layers.3.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.792729643872008e-05, "sensitivity": 0.6165566741934022 }, { "name": "model.layers.3.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.101906819822034e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006918259314261377, "sensitivity": 0.5277533306909968 }, { "name": "model.layers.3.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.773475277237594e-05, "sensitivity": 1.065904351227277 }, { "name": "model.layers.3.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.075218266232696e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.182939978316426e-05, "sensitivity": 0.8094881146101557 }, { "name": "model.layers.3.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.902955308556557e-05, "sensitivity": 0.6117015953663638 }, { "name": "model.layers.3.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.193683361743751e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.305395800154656e-05, "sensitivity": 0.7475151547380012 }, { "name": "model.layers.3.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.426580901257694e-05, "sensitivity": 0.633102349523764 }, { "name": "model.layers.3.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.676744763150054e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006479050498455763, "sensitivity": 0.551328686677978 }, { "name": "model.layers.3.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.48198695469182e-05, "sensitivity": 0.6350401600256882 }, { "name": "model.layers.3.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.833800855725713e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006586072267964482, "sensitivity": 0.5943592141304582 }, { "name": "model.layers.3.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006400199490599334, "sensitivity": 0.5501998948882761 }, { "name": "model.layers.3.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.879227273908327e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006750888423994184, "sensitivity": 0.5385456308886837 }, { "name": "model.layers.3.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006544290808960795, "sensitivity": 0.5306381212501703 }, { "name": "model.layers.3.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.093291062825301e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007017123280093074, "sensitivity": 0.5151548891316297 }, { "name": "model.layers.3.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000645527383312583, "sensitivity": 0.5463274425564426 }, { "name": "model.layers.3.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.935831381975731e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006828274927102029, "sensitivity": 0.5333471389618857 }, { "name": "model.layers.3.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.858881559106521e-05, "sensitivity": 0.7330903875455574 }, { "name": "model.layers.3.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.230936833162559e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006992520648054779, "sensitivity": 0.5205404914456199 }, { "name": "model.layers.3.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006345001165755093, "sensitivity": 0.554377005278974 }, { "name": "model.layers.3.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.920819035054592e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000684410217218101, "sensitivity": 0.5487942695479187 }, { "name": "model.layers.3.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7502795243635774e-05, "sensitivity": 0.6828860302131479 }, { "name": "model.layers.3.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.009514663674054e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.131693226052448e-05, "sensitivity": 0.8027049204789443 }, { "name": "model.layers.3.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006253503961488605, "sensitivity": 0.5621347816845306 }, { "name": "model.layers.3.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.734432875215134e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006615376914851367, "sensitivity": 0.5059224374696656 }, { "name": "model.layers.3.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5044372857082635e-05, "sensitivity": 0.696338610026166 }, { "name": "model.layers.3.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.73208239984524e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006520901224575937, "sensitivity": 0.5154749613399006 }, { "name": "model.layers.3.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8320682001067325e-05, "sensitivity": 0.8175322134037014 }, { "name": "model.layers.3.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.507033845082333e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007161802495829761, "sensitivity": 0.5376540225314611 }, { "name": "model.layers.3.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.683034396497533e-05, "sensitivity": 0.9988975464625485 }, { "name": "model.layers.3.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.148384841253574e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007014616276137531, "sensitivity": 0.5217756401296084 }, { "name": "model.layers.3.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006409456254914403, "sensitivity": 0.5978135238094178 }, { "name": "model.layers.3.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.939829748058401e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006849629571661353, "sensitivity": 0.548431495747174 }, { "name": "model.layers.3.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0148036380996928e-05, "sensitivity": 1.4424507097074126 }, { "name": "model.layers.3.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.016672386977007e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006866276962682605, "sensitivity": 0.5846404749955542 }, { "name": "model.layers.3.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000626497610937804, "sensitivity": 0.5449074783918296 }, { "name": "model.layers.3.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.828055691381451e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000664094346575439, "sensitivity": 0.5567688627763755 }, { "name": "model.layers.3.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006314413039945066, "sensitivity": 0.5564190051450675 }, { "name": "model.layers.3.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.917506769037573e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006772349588572979, "sensitivity": 0.5356475827492617 }, { "name": "model.layers.3.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.946636520093307e-05, "sensitivity": 0.6127192817404247 }, { "name": "model.layers.3.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.572028610207781e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007238445687107742, "sensitivity": 0.5789147539468882 }, { "name": "model.layers.3.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.965561649645679e-05, "sensitivity": 0.7090424618148079 }, { "name": "model.layers.3.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.521704563056119e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000710384629201144, "sensitivity": 0.5258531580553331 }, { "name": "model.layers.3.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6439614127157256e-05, "sensitivity": 0.6625542175648291 }, { "name": "model.layers.3.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.995320293550321e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.01209576416295e-05, "sensitivity": 0.6532757369505087 }, { "name": "model.layers.3.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.503774082171731e-05, "sensitivity": 0.6438836822286116 }, { "name": "model.layers.3.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.718124498343968e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006558168679475784, "sensitivity": 0.5197857729688911 }, { "name": "model.layers.3.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6219294492620975e-05, "sensitivity": 0.7374226579422996 }, { "name": "model.layers.3.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.879280706722056e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006719309603795409, "sensitivity": 0.5258574294089011 }, { "name": "model.layers.3.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.006429248373024e-05, "sensitivity": 1.0739160094167717 }, { "name": "model.layers.3.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.393767080226098e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007383766351267695, "sensitivity": 0.5649355831799652 }, { "name": "model.layers.3.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.762153159594163e-05, "sensitivity": 0.6793091596006905 }, { "name": "model.layers.3.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.07872038926871e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006984722567722201, "sensitivity": 0.5271541299642981 }, { "name": "model.layers.3.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.989874989609234e-05, "sensitivity": 1.0466011786443667 }, { "name": "model.layers.3.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.391964575414022e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007280685822479427, "sensitivity": 0.5081441401570113 }, { "name": "model.layers.3.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4615164117421955e-05, "sensitivity": 1.1189854924578508 }, { "name": "model.layers.3.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.781472509625019e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006547452649101615, "sensitivity": 0.5169401879797204 }, { "name": "model.layers.3.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0734313036664389e-05, "sensitivity": 1.369552824379895 }, { "name": "model.layers.3.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.147006388346199e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007067007245495915, "sensitivity": 0.5884208019055 }, { "name": "model.layers.3.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0428188033984043e-05, "sensitivity": 1.2413557413837366 }, { "name": "model.layers.3.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.269786467782978e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.279387162066996e-05, "sensitivity": 0.6032397191324705 }, { "name": "model.layers.3.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.654348569805734e-05, "sensitivity": 0.7034706375817534 }, { "name": "model.layers.3.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.896890797885135e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000680685683619231, "sensitivity": 0.5763596883582942 }, { "name": "model.layers.3.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0140966525068507e-05, "sensitivity": 0.8305808928412759 }, { "name": "model.layers.3.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.331507620416232e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007293893722817302, "sensitivity": 0.5057488615266915 }, { "name": "model.layers.3.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006461211014539003, "sensitivity": 0.5508058635562912 }, { "name": "model.layers.3.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.982010407024063e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000691656197886914, "sensitivity": 0.5308872852423764 }, { "name": "model.layers.3.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006294729537330568, "sensitivity": 0.5363988562641436 }, { "name": "model.layers.3.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.834717171637749e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000676157302223146, "sensitivity": 0.517707507129877 }, { "name": "model.layers.3.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006400012644007802, "sensitivity": 0.5314646919099445 }, { "name": "model.layers.3.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.881033757759724e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000677260453812778, "sensitivity": 0.5201251119964416 }, { "name": "model.layers.3.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.826718916068785e-05, "sensitivity": 0.7963243547561945 }, { "name": "model.layers.3.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.424131129278976e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007170999306254089, "sensitivity": 0.5605271764377608 }, { "name": "model.layers.3.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.965044692857191e-05, "sensitivity": 1.121931476295204 }, { "name": "model.layers.3.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.377862860063033e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.491619569715112e-05, "sensitivity": 0.7275503558516132 }, { "name": "model.layers.3.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.649604645441286e-05, "sensitivity": 0.9877248564071845 }, { "name": "model.layers.3.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.062484771973686e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007004417711868882, "sensitivity": 0.5217309481637598 }, { "name": "model.layers.3.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006284484989009798, "sensitivity": 0.5350580223049145 }, { "name": "model.layers.3.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.770875191046798e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8811798226088285e-05, "sensitivity": 0.6733398746406911 }, { "name": "model.layers.3.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006422955193556845, "sensitivity": 0.5505917269442313 }, { "name": "model.layers.3.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.993833269712923e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006958412704989314, "sensitivity": 0.5854761677525975 }, { "name": "model.layers.3.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006699791993014514, "sensitivity": 0.5358264929659072 }, { "name": "model.layers.3.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.198092705744784e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007099717622622848, "sensitivity": 0.5346157036245428 }, { "name": "model.layers.3.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006312435725703835, "sensitivity": 0.5251535189339226 }, { "name": "model.layers.3.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.814833912154427e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9694422816392034e-05, "sensitivity": 0.6193281486876698 }, { "name": "model.layers.3.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8780813560588285e-05, "sensitivity": 0.7231492023329549 }, { "name": "model.layers.3.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.200470465955732e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.326285802060738e-05, "sensitivity": 0.7051816550862493 }, { "name": "model.layers.3.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.654421329381876e-05, "sensitivity": 0.6031831838899582 }, { "name": "model.layers.3.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.833868499394157e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006718530785292387, "sensitivity": 0.5345202583615352 }, { "name": "model.layers.3.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.719436376239173e-05, "sensitivity": 0.9031337720154082 }, { "name": "model.layers.3.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.584708671653061e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.344912981148809e-05, "sensitivity": 0.7556124787183653 }, { "name": "model.layers.3.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006591096753254533, "sensitivity": 0.534234559632827 }, { "name": "model.layers.3.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.317984571069246e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007041746284812689, "sensitivity": 0.5190675988572403 }, { "name": "model.layers.3.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5427197366952896e-05, "sensitivity": 0.6398885719774335 }, { "name": "model.layers.3.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.706584715881036e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006582773639820516, "sensitivity": 0.5377715233347513 }, { "name": "model.layers.3.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8989502576878294e-05, "sensitivity": 0.7289309938505997 }, { "name": "model.layers.3.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.198083042363578e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.340871914289892e-05, "sensitivity": 0.6531462438374389 }, { "name": "model.layers.3.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006652008160017431, "sensitivity": 0.5171420998287919 }, { "name": "model.layers.3.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.12036728853127e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007055251626297832, "sensitivity": 0.5676039696237534 }, { "name": "model.layers.3.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006474289111793041, "sensitivity": 0.5876028630967646 }, { "name": "model.layers.3.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.983672508591553e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000688107218593359, "sensitivity": 0.5147396395345538 }, { "name": "model.layers.3.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006492796819657087, "sensitivity": 0.5222609367409197 }, { "name": "model.layers.3.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.036588615643268e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006943026091903448, "sensitivity": 0.5308839089224235 }, { "name": "model.layers.3.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006468555075116456, "sensitivity": 0.5260981794844644 }, { "name": "model.layers.3.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.986103133182041e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006897455314174294, "sensitivity": 0.5160467543670397 }, { "name": "model.layers.3.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006478052819147706, "sensitivity": 0.5387773289182812 }, { "name": "model.layers.3.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.009663593431469e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006892017554491758, "sensitivity": 0.5268405750863576 }, { "name": "model.layers.3.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006807054160162807, "sensitivity": 0.5244083928405672 }, { "name": "model.layers.3.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.457566996687092e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007268574554473162, "sensitivity": 0.5985906193100711 }, { "name": "model.layers.3.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0341043889638968e-05, "sensitivity": 1.292051315034703 }, { "name": "model.layers.3.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.742347634120961e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.618005863856524e-05, "sensitivity": 0.7489929393235137 }, { "name": "model.layers.3.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7905032008420676e-05, "sensitivity": 0.8416593950138431 }, { "name": "model.layers.3.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.132080443421728e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006992376293055713, "sensitivity": 0.5806547005250491 }, { "name": "model.layers.3.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.4707671653013676e-05, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.8423783103571623e-06, "sensitivity": 2.098377235895172 }, { "name": "model.layers.3.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.410683338093804e-07, "sensitivity": 10.0 }, { "name": "model.layers.3.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.288716134695278e-06, "sensitivity": 2.0998427026721727 }, { "name": "model.layers.3.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 4.266714768164093e-06, "sensitivity": 2.1413734045911217 }, { "name": "model.layers.3.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00016959359345491976, "sensitivity": 1.1131602589444205 }, { "name": "model.layers.3.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 9.776992555998731e-06, "sensitivity": 1.9396941305604074 }, { "name": "model.layers.3.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0004930543364025652, "sensitivity": 0.5919940435703095 }, { "name": "model.layers.3.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002845010021701455, "sensitivity": 0.7547897019998614 }, { "name": "model.layers.4.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.959023373085074e-06, "sensitivity": 1.7346312086510745 }, { "name": "model.layers.4.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.704270051865024e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006549562676809728, "sensitivity": 0.5199055569317109 }, { "name": "model.layers.4.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0713122719607782e-05, "sensitivity": 1.2416166142285858 }, { "name": "model.layers.4.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.377402996804449e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007140231318771839, "sensitivity": 0.5937989023630675 }, { "name": "model.layers.4.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.570126086240634e-05, "sensitivity": 0.9219779411151934 }, { "name": "model.layers.4.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.913018412684323e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006761299446225166, "sensitivity": 0.5182963202860243 }, { "name": "model.layers.4.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006638127379119396, "sensitivity": 0.5313759064184411 }, { "name": "model.layers.4.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.13152849382459e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007027533720247447, "sensitivity": 0.5392272895470478 }, { "name": "model.layers.4.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.153027061372995e-05, "sensitivity": 0.6808088158597838 }, { "name": "model.layers.4.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.620541057600349e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.810248305555433e-05, "sensitivity": 0.6028488418616891 }, { "name": "model.layers.4.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000610309827607125, "sensitivity": 0.5605668759695749 }, { "name": "model.layers.4.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.62465345410601e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006487327045761049, "sensitivity": 0.535803340485285 }, { "name": "model.layers.4.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7855759223457426e-05, "sensitivity": 0.6307544232643381 }, { "name": "model.layers.4.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.018855174261262e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006865696050226688, "sensitivity": 0.5187692507264638 }, { "name": "model.layers.4.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.309467163286172e-06, "sensitivity": 2.0965146858119565 }, { "name": "model.layers.4.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.221657713467721e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007054675370454788, "sensitivity": 0.5258228971118779 }, { "name": "model.layers.4.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.017951818648726e-05, "sensitivity": 0.8021256530441474 }, { "name": "model.layers.4.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.445762892326456e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007271431386470795, "sensitivity": 0.5144820788436422 }, { "name": "model.layers.4.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5640601203776896e-05, "sensitivity": 0.7938536134377926 }, { "name": "model.layers.4.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.896031325391959e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000684570986777544, "sensitivity": 0.5200069689255795 }, { "name": "model.layers.4.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7598110288381577e-05, "sensitivity": 0.9031943538194651 }, { "name": "model.layers.4.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.073951226426288e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000686062965542078, "sensitivity": 0.5316851545941069 }, { "name": "model.layers.4.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.564516322920099e-05, "sensitivity": 0.7047255894974899 }, { "name": "model.layers.4.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.906859996684943e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006784327561035752, "sensitivity": 0.5095191294543889 }, { "name": "model.layers.4.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.516660611552652e-06, "sensitivity": 1.4334432828157406 }, { "name": "model.layers.4.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.523261847883987e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006367077003233135, "sensitivity": 0.5787417372964158 }, { "name": "model.layers.4.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8555036957841367e-05, "sensitivity": 0.8164007384490011 }, { "name": "model.layers.4.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.308707156676974e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007151543977670372, "sensitivity": 0.5201783077886792 }, { "name": "model.layers.4.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.743873043684289e-05, "sensitivity": 0.8079103575090971 }, { "name": "model.layers.4.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.912332881052862e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006763706333003938, "sensitivity": 0.5778736155851006 }, { "name": "model.layers.4.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8498946600593626e-05, "sensitivity": 0.632088950096355 }, { "name": "model.layers.4.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.227319317986257e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000708900042809546, "sensitivity": 0.5239415335722322 }, { "name": "model.layers.4.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8306133723817766e-05, "sensitivity": 0.7203242586609653 }, { "name": "model.layers.4.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.970799747956335e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.063139153411612e-05, "sensitivity": 0.6428740079972061 }, { "name": "model.layers.4.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7433993788436055e-05, "sensitivity": 1.0890961528421093 }, { "name": "model.layers.4.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.148197257971333e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000705514510627836, "sensitivity": 0.5070438651210525 }, { "name": "model.layers.4.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.1027269111946225e-05, "sensitivity": 0.7232989010540429 }, { "name": "model.layers.4.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.530676728289109e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007466083625331521, "sensitivity": 0.5402790039990331 }, { "name": "model.layers.4.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9017234889324754e-05, "sensitivity": 1.0965640101616998 }, { "name": "model.layers.4.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.272433665799326e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007178797386586666, "sensitivity": 0.509755462156742 }, { "name": "model.layers.4.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7358101912541315e-05, "sensitivity": 0.8958166245357477 }, { "name": "model.layers.4.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.074166094549582e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007001352496445179, "sensitivity": 0.5112674749472584 }, { "name": "model.layers.4.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.433113983599469e-05, "sensitivity": 0.7794476399656942 }, { "name": "model.layers.4.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.944759777776198e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006729679880663753, "sensitivity": 0.5240349029615421 }, { "name": "model.layers.4.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.609160770196468e-06, "sensitivity": 1.2677153086862711 }, { "name": "model.layers.4.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.717171234209673e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006343355635181069, "sensitivity": 0.5342927937585691 }, { "name": "model.layers.4.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4938122048042715e-05, "sensitivity": 0.8171639088829395 }, { "name": "model.layers.4.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.81988842895953e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006602167850360274, "sensitivity": 0.5300885906130786 }, { "name": "model.layers.4.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.506798333954066e-05, "sensitivity": 0.704250212740196 }, { "name": "model.layers.4.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.852811000295333e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006746356375515461, "sensitivity": 0.554251167275761 }, { "name": "model.layers.4.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3919513447908685e-05, "sensitivity": 1.023908276174196 }, { "name": "model.layers.4.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.751232947659446e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006607001414522529, "sensitivity": 0.5582343361133111 }, { "name": "model.layers.4.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7377066696062684e-05, "sensitivity": 1.0741872383486537 }, { "name": "model.layers.4.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.193357648953679e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007175027276389301, "sensitivity": 0.5317101716642794 }, { "name": "model.layers.4.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.796353070763871e-05, "sensitivity": 0.6159290997042038 }, { "name": "model.layers.4.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.995516403345391e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006896600825712085, "sensitivity": 0.524997326269811 }, { "name": "model.layers.4.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.646081262966618e-05, "sensitivity": 0.865569014339094 }, { "name": "model.layers.4.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.977705086479546e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006867594784125686, "sensitivity": 0.5296383521306762 }, { "name": "model.layers.4.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.377529305405915e-05, "sensitivity": 1.091944070853306 }, { "name": "model.layers.4.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.929414328420535e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006854366511106491, "sensitivity": 0.571029937491516 }, { "name": "model.layers.4.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.49130309082102e-05, "sensitivity": 0.8289599335219076 }, { "name": "model.layers.4.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.077071361687558e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006736404611729085, "sensitivity": 0.52190277428335 }, { "name": "model.layers.4.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.949939804850146e-05, "sensitivity": 0.7021213464657461 }, { "name": "model.layers.4.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.466201512012049e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007363377371802926, "sensitivity": 0.5240762317457173 }, { "name": "model.layers.4.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0485124221304432e-05, "sensitivity": 1.2091829771167604 }, { "name": "model.layers.4.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.355311370498384e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007276776013895869, "sensitivity": 0.5350684047084941 }, { "name": "model.layers.4.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.0414713768986985e-05, "sensitivity": 1.1954192346210963 }, { "name": "model.layers.4.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.342640747585392e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.245885404292494e-05, "sensitivity": 0.6884716238135367 }, { "name": "model.layers.4.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.1937235032964963e-06, "sensitivity": 2.016860345775247 }, { "name": "model.layers.4.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.930723432356899e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006739184027537704, "sensitivity": 0.5483003430478943 }, { "name": "model.layers.4.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.823510582558811e-05, "sensitivity": 0.6324875784644 }, { "name": "model.layers.4.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.320157126538106e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007200042600743473, "sensitivity": 0.551155942535246 }, { "name": "model.layers.4.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.438040534500033e-05, "sensitivity": 0.9350599601086184 }, { "name": "model.layers.4.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.0775931842727e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.78917060920503e-05, "sensitivity": 0.7650789000076501 }, { "name": "model.layers.4.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.909376704948954e-05, "sensitivity": 0.8202056554845505 }, { "name": "model.layers.4.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.100538030295866e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000704023870639503, "sensitivity": 0.5285862520875373 }, { "name": "model.layers.4.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.693483035429381e-05, "sensitivity": 0.8736741529223327 }, { "name": "model.layers.4.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.222966248969897e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007106876000761986, "sensitivity": 0.583445400294085 }, { "name": "model.layers.4.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.017299892846495e-05, "sensitivity": 0.6698673774459906 }, { "name": "model.layers.4.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.503350959974341e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007395264692604542, "sensitivity": 0.5700756284276312 }, { "name": "model.layers.4.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.209360097069293e-05, "sensitivity": 1.0926622424704369 }, { "name": "model.layers.4.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.496142989613872e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006210344727151096, "sensitivity": 0.5283334296229076 }, { "name": "model.layers.4.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.060933810658753e-05, "sensitivity": 0.7141256202946706 }, { "name": "model.layers.4.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.611483058804879e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007574378396384418, "sensitivity": 0.5309336864195771 }, { "name": "model.layers.4.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5278953368542716e-05, "sensitivity": 0.6024113454213506 }, { "name": "model.layers.4.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.88068814977305e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000673910602927208, "sensitivity": 0.5348970477030579 }, { "name": "model.layers.4.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.725361451273784e-06, "sensitivity": 1.534273639951054 }, { "name": "model.layers.4.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.860005103386356e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006267968565225601, "sensitivity": 0.5489913871802142 }, { "name": "model.layers.4.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.67998577025719e-05, "sensitivity": 1.1807153799036776 }, { "name": "model.layers.4.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.182884817462764e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006991793634369969, "sensitivity": 0.5185081241337985 }, { "name": "model.layers.4.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.039304152072873e-05, "sensitivity": 1.3038230169811424 }, { "name": "model.layers.4.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.002355235068535e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006890959921292961, "sensitivity": 0.5297047279403019 }, { "name": "model.layers.4.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5416327086277306e-05, "sensitivity": 0.9179303270804696 }, { "name": "model.layers.4.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.009824460306845e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006637977785430849, "sensitivity": 0.5522048112531788 }, { "name": "model.layers.4.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.630448868032545e-05, "sensitivity": 0.8070689799551635 }, { "name": "model.layers.4.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.955032520432724e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006774622015655041, "sensitivity": 0.5880112787340146 }, { "name": "model.layers.4.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0157731594517827e-05, "sensitivity": 1.2135542491252087 }, { "name": "model.layers.4.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.545716016466031e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.038389983586967e-05, "sensitivity": 0.9323589220151864 }, { "name": "model.layers.4.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.676992704044096e-06, "sensitivity": 1.2849825942595428 }, { "name": "model.layers.4.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.675686907125055e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006298433290794492, "sensitivity": 0.5061507542744497 }, { "name": "model.layers.4.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.576513548381627e-06, "sensitivity": 1.3848172265230652 }, { "name": "model.layers.4.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.680072945324355e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5492269893875346e-05, "sensitivity": 0.6275082632314002 }, { "name": "model.layers.4.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.768839764641598e-05, "sensitivity": 0.7287039377070708 }, { "name": "model.layers.4.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.140807613519428e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000706191174685955, "sensitivity": 0.5502893097144734 }, { "name": "model.layers.4.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0309846402378753e-05, "sensitivity": 1.4476616898373786 }, { "name": "model.layers.4.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.682955131509516e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.3294981373474e-05, "sensitivity": 0.7825293612413317 }, { "name": "model.layers.4.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.719540058635175e-05, "sensitivity": 0.8004786904564992 }, { "name": "model.layers.4.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.98266524320934e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0802831285400316e-05, "sensitivity": 0.7692693835377475 }, { "name": "model.layers.4.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006590033881366253, "sensitivity": 0.5382897472288203 }, { "name": "model.layers.4.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.168420441099443e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007029214175418019, "sensitivity": 0.533473039544969 }, { "name": "model.layers.4.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0979662874888163e-05, "sensitivity": 1.4187784956459988 }, { "name": "model.layers.4.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.304548492153117e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007192965131253004, "sensitivity": 0.5147991117689501 }, { "name": "model.layers.4.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006418500561267138, "sensitivity": 0.5357255908001842 }, { "name": "model.layers.4.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.123759703768883e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.1001726862741634e-05, "sensitivity": 0.7788451550669223 }, { "name": "model.layers.4.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006414218223653734, "sensitivity": 0.5724397024626909 }, { "name": "model.layers.4.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.955604933660652e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006735196220688522, "sensitivity": 0.5213538938587077 }, { "name": "model.layers.4.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6913384469226e-05, "sensitivity": 0.7962210879346985 }, { "name": "model.layers.4.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.287492624323932e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007062514196150005, "sensitivity": 0.52689865220847 }, { "name": "model.layers.4.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6400713219773024e-05, "sensitivity": 1.1258377371068682 }, { "name": "model.layers.4.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.121783258095093e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006909125950187445, "sensitivity": 0.5351683018522232 }, { "name": "model.layers.4.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.836490890942514e-05, "sensitivity": 0.7554787803486829 }, { "name": "model.layers.4.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.338881917145045e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.446975748986006e-05, "sensitivity": 0.7499779706196759 }, { "name": "model.layers.4.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.48386968957493e-06, "sensitivity": 1.6020962215949133 }, { "name": "model.layers.4.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.603965291811619e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5742901167832315e-05, "sensitivity": 0.6006346031555789 }, { "name": "model.layers.4.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7089910114882514e-05, "sensitivity": 0.642136559694088 }, { "name": "model.layers.4.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.960771432000911e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006843778537586331, "sensitivity": 0.5418152861423355 }, { "name": "model.layers.4.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.311377390171401e-05, "sensitivity": 1.1746644346618864 }, { "name": "model.layers.4.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.518805892279488e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006235972978174686, "sensitivity": 0.5478413725982015 }, { "name": "model.layers.4.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.053935193340294e-05, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.814705228753155e-06, "sensitivity": 2.0985073355307877 }, { "name": "model.layers.4.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.592649010097375e-07, "sensitivity": 10.0 }, { "name": "model.layers.4.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.258909605894587e-06, "sensitivity": 2.1021021817516923 }, { "name": "model.layers.4.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 4.3304680730216205e-06, "sensitivity": 2.139205155040418 }, { "name": "model.layers.4.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00015503790928050876, "sensitivity": 1.0655228926901876 }, { "name": "model.layers.4.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 8.80186416907236e-06, "sensitivity": 1.8968979120843217 }, { "name": "model.layers.4.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 4.173161505605094e-05, "sensitivity": 0.6830911372138859 }, { "name": "model.layers.4.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002661650942172855, "sensitivity": 0.8965080881700844 }, { "name": "model.layers.5.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.174215039005503e-05, "sensitivity": 0.9843739150451165 }, { "name": "model.layers.5.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.564810408031917e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5830976634752005e-05, "sensitivity": 0.6337483774187305 }, { "name": "model.layers.5.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.842257814947516e-05, "sensitivity": 0.6932919515382885 }, { "name": "model.layers.5.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.355699611049204e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007030800334177911, "sensitivity": 0.516178696787411 }, { "name": "model.layers.5.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.353846790967509e-05, "sensitivity": 0.6973962512973638 }, { "name": "model.layers.5.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.496877406585554e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006247282726690173, "sensitivity": 0.5252865660808536 }, { "name": "model.layers.5.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3906591347185895e-05, "sensitivity": 1.0536377867547408 }, { "name": "model.layers.5.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.070972062843794e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006397582474164665, "sensitivity": 0.5386142481473728 }, { "name": "model.layers.5.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.2231858717277646e-05, "sensitivity": 1.033181185567674 }, { "name": "model.layers.5.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.714136364076694e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006197073380462825, "sensitivity": 0.519867892027612 }, { "name": "model.layers.5.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.725809023715556e-05, "sensitivity": 0.7073294208690512 }, { "name": "model.layers.5.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.491961244137201e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006804433651268482, "sensitivity": 0.545881503122309 }, { "name": "model.layers.5.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.329336611088365e-05, "sensitivity": 1.0075511456440052 }, { "name": "model.layers.5.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.834799819444015e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007530195871368051, "sensitivity": 0.5154840169960146 }, { "name": "model.layers.5.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.605082697002217e-05, "sensitivity": 0.7955405343898763 }, { "name": "model.layers.5.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.295622370089404e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.029677751939744e-05, "sensitivity": 0.6594708535753782 }, { "name": "model.layers.5.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.260434126190376e-06, "sensitivity": 1.6321710367623246 }, { "name": "model.layers.5.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.53603456410201e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 4.891031130682677e-05, "sensitivity": 0.7298765596884031 }, { "name": "model.layers.5.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006408148328773677, "sensitivity": 0.5253962529194666 }, { "name": "model.layers.5.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.203899829415604e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006920511368662119, "sensitivity": 0.5587104692515144 }, { "name": "model.layers.5.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006581306224688888, "sensitivity": 0.5502422445742864 }, { "name": "model.layers.5.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.373737733156304e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007101836381480098, "sensitivity": 0.5422364777205122 }, { "name": "model.layers.5.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.924526340095326e-05, "sensitivity": 0.7175679843428365 }, { "name": "model.layers.5.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.334136628538545e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007063177181407809, "sensitivity": 0.5203362484609253 }, { "name": "model.layers.5.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.671524195349775e-05, "sensitivity": 0.8008182676364874 }, { "name": "model.layers.5.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.309321634034859e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006944822962395847, "sensitivity": 0.5168646184662502 }, { "name": "model.layers.5.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.702851194655523e-05, "sensitivity": 0.679463559976049 }, { "name": "model.layers.5.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.206001899045077e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006879428401589394, "sensitivity": 0.5593631946767503 }, { "name": "model.layers.5.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.646301360684447e-05, "sensitivity": 1.0021351770682114 }, { "name": "model.layers.5.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.195568289513176e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.922857599216513e-05, "sensitivity": 0.6967542960491347 }, { "name": "model.layers.5.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006509709055535495, "sensitivity": 0.5423859156865167 }, { "name": "model.layers.5.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.079944796510972e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006791597115807235, "sensitivity": 0.539600425108096 }, { "name": "model.layers.5.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6305507314391434e-05, "sensitivity": 0.9211884975750875 }, { "name": "model.layers.5.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.026019150340289e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006643926026299596, "sensitivity": 0.5172849654929196 }, { "name": "model.layers.5.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.77859282202553e-05, "sensitivity": 0.7549833002091353 }, { "name": "model.layers.5.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.586571998923318e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006818104302510619, "sensitivity": 0.5349807192449223 }, { "name": "model.layers.5.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.907707964070141e-05, "sensitivity": 0.6574790652188588 }, { "name": "model.layers.5.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.213359142748232e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006978644523769617, "sensitivity": 0.5982525898963724 }, { "name": "model.layers.5.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.580030119745061e-05, "sensitivity": 0.7748379942589774 }, { "name": "model.layers.5.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.89624733038363e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006567444070242345, "sensitivity": 0.541440914901235 }, { "name": "model.layers.5.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006629341514781117, "sensitivity": 0.5304558146363014 }, { "name": "model.layers.5.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.269876848818967e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007067201077006757, "sensitivity": 0.5168499046006105 }, { "name": "model.layers.5.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5823660659370944e-05, "sensitivity": 0.6864141336217173 }, { "name": "model.layers.5.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.477018246187072e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006932415417395532, "sensitivity": 0.5659518007170097 }, { "name": "model.layers.5.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0476388524693903e-05, "sensitivity": 1.2095679327853468 }, { "name": "model.layers.5.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.940011078564567e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006665707915090024, "sensitivity": 0.5539298415861739 }, { "name": "model.layers.5.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.00069728511152789, "sensitivity": 0.515991068608581 }, { "name": "model.layers.5.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.440546940211789e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007280634599737823, "sensitivity": 0.5293168124723057 }, { "name": "model.layers.5.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000653837516438216, "sensitivity": 0.54288689908718 }, { "name": "model.layers.5.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.920973080719705e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006751860491931438, "sensitivity": 0.5221701424280901 }, { "name": "model.layers.5.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006429021595977247, "sensitivity": 0.5684686334327551 }, { "name": "model.layers.5.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.96036727529281e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9974972828058526e-05, "sensitivity": 0.7781045262221374 }, { "name": "model.layers.5.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.555509414989501e-05, "sensitivity": 0.9789941479521471 }, { "name": "model.layers.5.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.478286991296045e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7846667914418504e-05, "sensitivity": 0.6565027945488117 }, { "name": "model.layers.5.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.553921073442325e-05, "sensitivity": 0.6710317476266412 }, { "name": "model.layers.5.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.006390549373464e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006742792902514338, "sensitivity": 0.5234245461923936 }, { "name": "model.layers.5.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.029563554766355e-05, "sensitivity": 1.5892542250939614 }, { "name": "model.layers.5.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.095878575251845e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006657556514255702, "sensitivity": 0.556324773196202 }, { "name": "model.layers.5.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.908549792366102e-05, "sensitivity": 0.6664558343050853 }, { "name": "model.layers.5.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.301902431005146e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.134063733043149e-05, "sensitivity": 0.734975632915761 }, { "name": "model.layers.5.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006507124635390937, "sensitivity": 0.5654197298507033 }, { "name": "model.layers.5.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.145363613541122e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006953277625143528, "sensitivity": 0.5780345991652724 }, { "name": "model.layers.5.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000635674805380404, "sensitivity": 0.5918118877563743 }, { "name": "model.layers.5.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.228787015061243e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006791693158447742, "sensitivity": 0.535816339537792 }, { "name": "model.layers.5.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.716276791645214e-05, "sensitivity": 0.787391963237162 }, { "name": "model.layers.5.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.880636990696075e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.029927681083791e-05, "sensitivity": 0.6125050699529027 }, { "name": "model.layers.5.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006542237242683768, "sensitivity": 0.5257367007978292 }, { "name": "model.layers.5.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.196625008669798e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006931214011274278, "sensitivity": 0.5145138811849617 }, { "name": "model.layers.5.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.656527355313301e-05, "sensitivity": 0.6811943924738636 }, { "name": "model.layers.5.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.200555162649835e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.873247209819965e-05, "sensitivity": 0.6020323996354071 }, { "name": "model.layers.5.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3241787099977955e-05, "sensitivity": 1.1338179137785596 }, { "name": "model.layers.5.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.613159146378166e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000610903836786747, "sensitivity": 0.5718141096041045 }, { "name": "model.layers.5.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.801324005005881e-05, "sensitivity": 0.612484346857023 }, { "name": "model.layers.5.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.292070793278981e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.976529064355418e-05, "sensitivity": 0.9273112634952105 }, { "name": "model.layers.5.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.864018385182135e-05, "sensitivity": 0.7857327125953946 }, { "name": "model.layers.5.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.289542398008052e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007019054028205574, "sensitivity": 0.5346692669026316 }, { "name": "model.layers.5.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7246070355176926e-05, "sensitivity": 0.6343480853423501 }, { "name": "model.layers.5.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.344206440189737e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006717690266668797, "sensitivity": 0.5292566951553956 }, { "name": "model.layers.5.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.837646313011646e-05, "sensitivity": 0.7265412878152719 }, { "name": "model.layers.5.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.604503823837149e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000697412877343595, "sensitivity": 0.5925325553723992 }, { "name": "model.layers.5.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006463145255111158, "sensitivity": 0.5488669948915348 }, { "name": "model.layers.5.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.012177209413494e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000682407699059695, "sensitivity": 0.5244532954282681 }, { "name": "model.layers.5.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.2830815548077226e-05, "sensitivity": 0.7663910631837445 }, { "name": "model.layers.5.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.597265726464684e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006347924936562777, "sensitivity": 0.5088161255018706 }, { "name": "model.layers.5.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006716195493936539, "sensitivity": 0.5396696316802261 }, { "name": "model.layers.5.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.201529458849109e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007049547275528312, "sensitivity": 0.5411393825692137 }, { "name": "model.layers.5.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.735183003707789e-05, "sensitivity": 0.6703659877324708 }, { "name": "model.layers.5.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.314721190392447e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007044244557619095, "sensitivity": 0.5172087733663017 }, { "name": "model.layers.5.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4064392315922305e-05, "sensitivity": 0.6419389805097342 }, { "name": "model.layers.5.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.894686978535901e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006561823538504541, "sensitivity": 0.5510746407303759 }, { "name": "model.layers.5.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000687027582898736, "sensitivity": 0.5375959837789887 }, { "name": "model.layers.5.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.399092171704979e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000719776377081871, "sensitivity": 0.5337910396441834 }, { "name": "model.layers.5.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.596328264800832e-05, "sensitivity": 0.8432147504930958 }, { "name": "model.layers.5.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.925926416239236e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006601737695746124, "sensitivity": 0.5082670036480471 }, { "name": "model.layers.5.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.434603008325212e-05, "sensitivity": 0.7519967508570867 }, { "name": "model.layers.5.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.729173153667944e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006471384549513459, "sensitivity": 0.5674974044724468 }, { "name": "model.layers.5.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.743532528867945e-05, "sensitivity": 0.7210069684863524 }, { "name": "model.layers.5.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.20418347807572e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.957320536253974e-05, "sensitivity": 0.944383109278147 }, { "name": "model.layers.5.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.49894092627801e-06, "sensitivity": 1.4650584383291423 }, { "name": "model.layers.5.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.308693289407529e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006015264661982656, "sensitivity": 0.5255526858640602 }, { "name": "model.layers.5.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.362502270145342e-05, "sensitivity": 0.7566271527572925 }, { "name": "model.layers.5.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.930090765104978e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006570519763045013, "sensitivity": 0.5144489605770642 }, { "name": "model.layers.5.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.573302769334987e-05, "sensitivity": 0.7258019505556463 }, { "name": "model.layers.5.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.769873041572282e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006574344588443637, "sensitivity": 0.5264402729860789 }, { "name": "model.layers.5.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006444156169891357, "sensitivity": 0.5681259950445033 }, { "name": "model.layers.5.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.934213618274953e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.00707862759009e-05, "sensitivity": 0.6244539378251253 }, { "name": "model.layers.5.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.686370423063636e-05, "sensitivity": 0.6800411359730371 }, { "name": "model.layers.5.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.917224825680023e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006606096867471933, "sensitivity": 0.5469396662930713 }, { "name": "model.layers.5.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3335090342443436e-05, "sensitivity": 0.6839447914009902 }, { "name": "model.layers.5.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.89446699450491e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.844645056640729e-05, "sensitivity": 0.6789151255553665 }, { "name": "model.layers.5.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.313480505719781e-05, "sensitivity": 0.8584333073414157 }, { "name": "model.layers.5.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.694774927178514e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006270682788453996, "sensitivity": 0.5300546855743993 }, { "name": "model.layers.5.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.604553734883666e-05, "sensitivity": 0.6272113452550139 }, { "name": "model.layers.5.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.172410280669283e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006582462228834629, "sensitivity": 0.510560418248403 }, { "name": "model.layers.5.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5765056458767503e-05, "sensitivity": 0.7189735787208792 }, { "name": "model.layers.5.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.850014304087381e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006653275340795517, "sensitivity": 0.5232196949510948 }, { "name": "model.layers.5.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.578563650487922e-05, "sensitivity": 1.0818392452655214 }, { "name": "model.layers.5.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.973244583401538e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006656750338152051, "sensitivity": 0.5284393022162583 }, { "name": "model.layers.5.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4715397709514946e-05, "sensitivity": 1.1575811033805428 }, { "name": "model.layers.5.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.734704586757289e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.585952749243006e-05, "sensitivity": 0.6698928650932614 }, { "name": "model.layers.5.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.115920405136421e-05, "sensitivity": 0.9585933714760068 }, { "name": "model.layers.5.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.284325877459196e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.330998439807445e-05, "sensitivity": 0.6000029916787292 }, { "name": "model.layers.5.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.215398778091185e-05, "sensitivity": 0.7472831733199926 }, { "name": "model.layers.5.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.608684432445443e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006313082994893193, "sensitivity": 0.5473204568801391 }, { "name": "model.layers.5.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.805590990348719e-05, "sensitivity": 0.8599827505317831 }, { "name": "model.layers.5.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.342478400256368e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.303254485828802e-05, "sensitivity": 0.9845943170226459 }, { "name": "model.layers.5.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3094069092621794e-06, "sensitivity": 2.0972684463764555 }, { "name": "model.layers.5.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.186810423969291e-07, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.1210961019969545e-05, "sensitivity": 1.2071490709379562 }, { "name": "model.layers.5.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 9.185856470139697e-06, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.7325196495221462e-06, "sensitivity": 2.098507133975826 }, { "name": "model.layers.5.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0104139391842182e-06, "sensitivity": 10.0 }, { "name": "model.layers.5.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.3220778782851994e-06, "sensitivity": 2.102846579004364 }, { "name": "model.layers.5.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 5.372161467676051e-06, "sensitivity": 2.1550550172764646 }, { "name": "model.layers.5.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.0001751558593241498, "sensitivity": 1.179238173833278 }, { "name": "model.layers.5.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 9.56397252593888e-06, "sensitivity": 1.8177267036929416 }, { "name": "model.layers.5.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0005624552140943706, "sensitivity": 0.5275247361843922 }, { "name": "model.layers.5.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002904439461417496, "sensitivity": 1.0437565429407842 }, { "name": "model.layers.6.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006554018473252654, "sensitivity": 0.5322259067099371 }, { "name": "model.layers.6.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.044321025910904e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006911138771101832, "sensitivity": 0.5541707118329273 }, { "name": "model.layers.6.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.313691508490592e-05, "sensitivity": 1.1504621314023844 }, { "name": "model.layers.6.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.754645826527849e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006393723888322711, "sensitivity": 0.5836531099395504 }, { "name": "model.layers.6.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000657164491713047, "sensitivity": 0.5740225757954931 }, { "name": "model.layers.6.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.469273898801475e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007232431089505553, "sensitivity": 0.5019334423065391 }, { "name": "model.layers.6.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0180729077546857e-05, "sensitivity": 1.3075928298156805 }, { "name": "model.layers.6.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.936708132343483e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006528365192934871, "sensitivity": 0.5297076561069719 }, { "name": "model.layers.6.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.565343235502951e-05, "sensitivity": 0.7201308727265029 }, { "name": "model.layers.6.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.929150006522832e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006655083852820098, "sensitivity": 0.5398736213827701 }, { "name": "model.layers.6.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006868256605230272, "sensitivity": 0.519030146800292 }, { "name": "model.layers.6.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.453734613387496e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007280096760950983, "sensitivity": 0.5254971861095359 }, { "name": "model.layers.6.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.830052396049723e-05, "sensitivity": 0.6540282437817707 }, { "name": "model.layers.6.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.966799108136911e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006757627124898136, "sensitivity": 0.5482891702613181 }, { "name": "model.layers.6.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.77673563384451e-05, "sensitivity": 0.9741345558962546 }, { "name": "model.layers.6.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.235218279471155e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006719117518514395, "sensitivity": 0.5577829679811837 }, { "name": "model.layers.6.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0213829227723181e-05, "sensitivity": 1.4861117726056752 }, { "name": "model.layers.6.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.984256515352172e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.011313234921545e-05, "sensitivity": 0.8173159094697566 }, { "name": "model.layers.6.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6362623581662774e-05, "sensitivity": 0.9968345576375092 }, { "name": "model.layers.6.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.013241318214568e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006609484553337097, "sensitivity": 0.5586074782808822 }, { "name": "model.layers.6.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.694651554222219e-05, "sensitivity": 0.6020355788342076 }, { "name": "model.layers.6.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.179500360303791e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007028586114756763, "sensitivity": 0.5413638404227371 }, { "name": "model.layers.6.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5556942243129015e-05, "sensitivity": 0.820427356341269 }, { "name": "model.layers.6.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.890008196729468e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006654657190665603, "sensitivity": 0.5257731627154053 }, { "name": "model.layers.6.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.626984057016671e-05, "sensitivity": 0.8588157248540575 }, { "name": "model.layers.6.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.207333171914797e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006917174905538559, "sensitivity": 0.5284698706145263 }, { "name": "model.layers.6.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.419144144980237e-05, "sensitivity": 1.1337131833487177 }, { "name": "model.layers.6.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.86152282266994e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006482896278612316, "sensitivity": 0.5481658534158259 }, { "name": "model.layers.6.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.694383798982017e-05, "sensitivity": 0.6281391973043511 }, { "name": "model.layers.6.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.640837343889871e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006447023479267955, "sensitivity": 0.527591806791504 }, { "name": "model.layers.6.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.457294173538685e-05, "sensitivity": 0.7064950473669898 }, { "name": "model.layers.6.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.727168854718911e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006333797937259078, "sensitivity": 0.5364980987689366 }, { "name": "model.layers.6.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0000441761803813e-05, "sensitivity": 1.2751642967599524 }, { "name": "model.layers.6.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.555439995281631e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.0630456017679535e-05, "sensitivity": 1.2249667298009408 }, { "name": "model.layers.6.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.912419146625325e-05, "sensitivity": 1.0389221255457723 }, { "name": "model.layers.6.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.088516215640993e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006984553183428943, "sensitivity": 0.5285616740386496 }, { "name": "model.layers.6.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006383167929016054, "sensitivity": 0.5639585703445329 }, { "name": "model.layers.6.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.091443651712325e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006784825818613172, "sensitivity": 0.5501404759866451 }, { "name": "model.layers.6.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.370170038077049e-05, "sensitivity": 0.733994129798322 }, { "name": "model.layers.6.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.828340476909943e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006538236048072577, "sensitivity": 0.5431231251981703 }, { "name": "model.layers.6.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0326089977752417e-05, "sensitivity": 1.4977216942356018 }, { "name": "model.layers.6.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.823808351124171e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006560046458616853, "sensitivity": 0.5076706554567496 }, { "name": "model.layers.6.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0339149058563635e-05, "sensitivity": 0.7162884799869463 }, { "name": "model.layers.6.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.269820005400106e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007013003341853619, "sensitivity": 0.5178252041083931 }, { "name": "model.layers.6.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006524806376546621, "sensitivity": 0.5374168813636166 }, { "name": "model.layers.6.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.919238788010261e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000682905490975827, "sensitivity": 0.524269699434542 }, { "name": "model.layers.6.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6832825066521764e-05, "sensitivity": 0.9280927405690907 }, { "name": "model.layers.6.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.225106972124195e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006909620715305209, "sensitivity": 0.5305612992119594 }, { "name": "model.layers.6.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3570511227007955e-05, "sensitivity": 1.132196602487088 }, { "name": "model.layers.6.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.716884174944425e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006345995934680104, "sensitivity": 0.5375532804240135 }, { "name": "model.layers.6.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0937159458990209e-05, "sensitivity": 1.7507448239850112 }, { "name": "model.layers.6.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.301999633251398e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007088084239512682, "sensitivity": 0.5321531900838443 }, { "name": "model.layers.6.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.553107621381059e-05, "sensitivity": 0.7784711585086197 }, { "name": "model.layers.6.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.178356670716312e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006693013710901141, "sensitivity": 0.5228456258546624 }, { "name": "model.layers.6.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.487708403961733e-05, "sensitivity": 0.7568763462491285 }, { "name": "model.layers.6.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.931458417762769e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006566282245330513, "sensitivity": 0.5339737452275339 }, { "name": "model.layers.6.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006470398511737585, "sensitivity": 0.5578504382031609 }, { "name": "model.layers.6.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.054380037312512e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006846371106803417, "sensitivity": 0.5201100449394973 }, { "name": "model.layers.6.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7614735851529986e-05, "sensitivity": 0.9849311333229777 }, { "name": "model.layers.6.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.306955810941872e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.031420343788341e-05, "sensitivity": 0.623568544442872 }, { "name": "model.layers.6.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.880229582544416e-05, "sensitivity": 0.8209464388676091 }, { "name": "model.layers.6.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.233018439161242e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007049901178106666, "sensitivity": 0.5138082631252385 }, { "name": "model.layers.6.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5708449508529156e-05, "sensitivity": 0.8073737087595007 }, { "name": "model.layers.6.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.222611546036205e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000673370435833931, "sensitivity": 0.5701522969928297 }, { "name": "model.layers.6.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.498591053765267e-05, "sensitivity": 0.6405688580230897 }, { "name": "model.layers.6.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.075684382267355e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006615861784666777, "sensitivity": 0.5269150957024943 }, { "name": "model.layers.6.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4644286137772724e-05, "sensitivity": 0.9695087254359768 }, { "name": "model.layers.6.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.750279115090962e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006405391031876206, "sensitivity": 0.5251737866005454 }, { "name": "model.layers.6.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.950443301117048e-05, "sensitivity": 0.8385405137928128 }, { "name": "model.layers.6.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.073083795854473e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006922497414052486, "sensitivity": 0.5444900050838899 }, { "name": "model.layers.6.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.785828034277074e-05, "sensitivity": 1.055375458936517 }, { "name": "model.layers.6.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.963331091152213e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006777415401302278, "sensitivity": 0.5340883278341996 }, { "name": "model.layers.6.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0380054492270574e-05, "sensitivity": 1.0292258736710809 }, { "name": "model.layers.6.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.362626550071582e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007096345070749521, "sensitivity": 0.5143366618039594 }, { "name": "model.layers.6.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.340871211956255e-05, "sensitivity": 0.9863218151020383 }, { "name": "model.layers.6.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.395532068381726e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6876531743910164e-05, "sensitivity": 0.6060369892020345 }, { "name": "model.layers.6.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006280107190832496, "sensitivity": 0.5775759466860291 }, { "name": "model.layers.6.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.714584858651506e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006474937545135617, "sensitivity": 0.5319294029995575 }, { "name": "model.layers.6.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006430996581912041, "sensitivity": 0.5406266256930873 }, { "name": "model.layers.6.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.015056328578794e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006772935157641768, "sensitivity": 0.5877906475182323 }, { "name": "model.layers.6.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.710066034225747e-05, "sensitivity": 0.7471953289717292 }, { "name": "model.layers.6.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.102657152950997e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000695804541464895, "sensitivity": 0.5094190887003807 }, { "name": "model.layers.6.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.48322859685868e-05, "sensitivity": 0.6224332152129305 }, { "name": "model.layers.6.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.083286621105799e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006729968590661883, "sensitivity": 0.52705711665244 }, { "name": "model.layers.6.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9344456531107426e-05, "sensitivity": 0.8243890275146544 }, { "name": "model.layers.6.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.108183470132644e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.217225745785981e-05, "sensitivity": 0.7626473875928069 }, { "name": "model.layers.6.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006600222550332546, "sensitivity": 0.5869058986582536 }, { "name": "model.layers.6.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.248729960134369e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007126370328478515, "sensitivity": 0.5391390231611126 }, { "name": "model.layers.6.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.878698620013893e-06, "sensitivity": 1.4005742678135402 }, { "name": "model.layers.6.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.750721356889699e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006429735803976655, "sensitivity": 0.518499441667112 }, { "name": "model.layers.6.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9441354096634313e-05, "sensitivity": 0.9900358644197229 }, { "name": "model.layers.6.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.228361826288165e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000695324910338968, "sensitivity": 0.5535241560125183 }, { "name": "model.layers.6.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.2797717216890305e-05, "sensitivity": 0.7821601836766932 }, { "name": "model.layers.6.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.645305805046519e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006292031612247229, "sensitivity": 0.5317107109072646 }, { "name": "model.layers.6.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.70462980249431e-05, "sensitivity": 0.7843891851529493 }, { "name": "model.layers.6.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.127181677584304e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.035942351445556e-05, "sensitivity": 0.7552309681678469 }, { "name": "model.layers.6.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.701258123735897e-05, "sensitivity": 0.777322376773594 }, { "name": "model.layers.6.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.342977485473966e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006784155848436058, "sensitivity": 0.5453614732023868 }, { "name": "model.layers.6.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.104051135480404e-05, "sensitivity": 0.6552720376763157 }, { "name": "model.layers.6.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.449205329772667e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007276737014763057, "sensitivity": 0.5359690795662718 }, { "name": "model.layers.6.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4772041039541364e-05, "sensitivity": 0.7795287821969561 }, { "name": "model.layers.6.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.916089094171184e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006677813362330198, "sensitivity": 0.5100133354152152 }, { "name": "model.layers.6.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006660979706794024, "sensitivity": 0.5313935921410139 }, { "name": "model.layers.6.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.150789886305574e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006914662080816925, "sensitivity": 0.5266513399673843 }, { "name": "model.layers.6.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.164110189070925e-05, "sensitivity": 1.1958459195665665 }, { "name": "model.layers.6.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.426354618975893e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.351617801352404e-05, "sensitivity": 0.622156211956137 }, { "name": "model.layers.6.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.663411502609961e-05, "sensitivity": 0.7844660401844595 }, { "name": "model.layers.6.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.103801410972665e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006890061195008457, "sensitivity": 0.5180957369779712 }, { "name": "model.layers.6.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.890367538086139e-05, "sensitivity": 0.8524389334413824 }, { "name": "model.layers.6.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.897919320181245e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.284908158704638e-05, "sensitivity": 0.9959739133078523 }, { "name": "model.layers.6.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8093206462217495e-05, "sensitivity": 0.9243585035991819 }, { "name": "model.layers.6.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.171907216412365e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006913856486789882, "sensitivity": 0.5103035851714822 }, { "name": "model.layers.6.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0311521691619419e-05, "sensitivity": 1.314706545458852 }, { "name": "model.layers.6.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.090200486141839e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9573583712335676e-05, "sensitivity": 0.9498941371847344 }, { "name": "model.layers.6.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006669365102425218, "sensitivity": 0.5035688116671737 }, { "name": "model.layers.6.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.172177791086142e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00070140918251127, "sensitivity": 0.5065843335969656 }, { "name": "model.layers.6.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.02882937528193e-05, "sensitivity": 0.8835380925921081 }, { "name": "model.layers.6.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.205243039403285e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007065918180160224, "sensitivity": 0.5184654004137565 }, { "name": "model.layers.6.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7779743656283244e-05, "sensitivity": 0.9903254808522901 }, { "name": "model.layers.6.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.340029585771845e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.092302646720782e-05, "sensitivity": 0.6699571374582189 }, { "name": "model.layers.6.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.622508979286067e-05, "sensitivity": 0.9817457293655094 }, { "name": "model.layers.6.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.984146239119582e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.988773045828566e-05, "sensitivity": 0.8908818072382368 }, { "name": "model.layers.6.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.633967521134764e-05, "sensitivity": 0.6377902469572438 }, { "name": "model.layers.6.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.733494958803931e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006563730421476066, "sensitivity": 0.551345801704431 }, { "name": "model.layers.6.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006390023627318442, "sensitivity": 0.5212106278020271 }, { "name": "model.layers.6.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.995547098791576e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006774008506909013, "sensitivity": 0.5079884126487787 }, { "name": "model.layers.6.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.43172427569516e-05, "sensitivity": 1.182943807113232 }, { "name": "model.layers.6.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.889531848879415e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006475000409409404, "sensitivity": 0.5494417532154581 }, { "name": "model.layers.6.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 9.630176464270335e-06, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.964664534170879e-06, "sensitivity": 2.099288426383133 }, { "name": "model.layers.6.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.62519925703964e-07, "sensitivity": 10.0 }, { "name": "model.layers.6.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.3236229960966739e-06, "sensitivity": 2.10155937077606 }, { "name": "model.layers.6.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 8.352782970177941e-06, "sensitivity": 2.148186083435637 }, { "name": "model.layers.6.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.0001912114821607247, "sensitivity": 0.9471759698748046 }, { "name": "model.layers.6.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.195357344840886e-05, "sensitivity": 1.7497405766493983 }, { "name": "model.layers.6.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0005293141584843397, "sensitivity": 0.5548273876801484 }, { "name": "model.layers.6.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003165740636177361, "sensitivity": 0.7335503835102731 }, { "name": "model.layers.7.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006285854615271091, "sensitivity": 0.5310993728027205 }, { "name": "model.layers.7.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.447576197388116e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006641258951276541, "sensitivity": 0.5080962802791482 }, { "name": "model.layers.7.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006640524370595813, "sensitivity": 0.5782057171300815 }, { "name": "model.layers.7.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.376430974341929e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006968459929339588, "sensitivity": 0.5164425281865961 }, { "name": "model.layers.7.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7069682952715084e-05, "sensitivity": 0.8975566990839071 }, { "name": "model.layers.7.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.024205158108089e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9771304222522303e-05, "sensitivity": 0.8117419753727988 }, { "name": "model.layers.7.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006029325304552913, "sensitivity": 0.5764435035328658 }, { "name": "model.layers.7.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.068990501262306e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006262838141992688, "sensitivity": 0.5369736942721245 }, { "name": "model.layers.7.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006223347736522555, "sensitivity": 0.5499916206014084 }, { "name": "model.layers.7.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.320382794910984e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006522891926579177, "sensitivity": 0.5161741146764348 }, { "name": "model.layers.7.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.621020682156086e-05, "sensitivity": 0.6750991206741357 }, { "name": "model.layers.7.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.090490387578029e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000662352133076638, "sensitivity": 0.5616967397200032 }, { "name": "model.layers.7.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0005698543973267078, "sensitivity": 0.515806391900241 }, { "name": "model.layers.7.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.74806222175539e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005827447166666389, "sensitivity": 0.5205471550745862 }, { "name": "model.layers.7.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006065201014280319, "sensitivity": 0.5257249701852521 }, { "name": "model.layers.7.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.425466381188016e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006201675860211253, "sensitivity": 0.511119882041758 }, { "name": "model.layers.7.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006469734362326562, "sensitivity": 0.5593799943639299 }, { "name": "model.layers.7.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.785537950941944e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.836343552800827e-05, "sensitivity": 0.6318491492464338 }, { "name": "model.layers.7.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.442996189231053e-05, "sensitivity": 0.745233893538501 }, { "name": "model.layers.7.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.126750460884068e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006572717684321105, "sensitivity": 0.5149819813909353 }, { "name": "model.layers.7.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3967873100191355e-05, "sensitivity": 0.6156906464052111 }, { "name": "model.layers.7.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.125473532847536e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000627335102763027, "sensitivity": 0.535252967386026 }, { "name": "model.layers.7.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.757100734626874e-05, "sensitivity": 0.8761712667416477 }, { "name": "model.layers.7.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.041139499757264e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.930274710408412e-05, "sensitivity": 0.9952726601827502 }, { "name": "model.layers.7.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.905101716052741e-05, "sensitivity": 0.8879450170409352 }, { "name": "model.layers.7.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.086734174459707e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000679867691360414, "sensitivity": 0.5254144425744017 }, { "name": "model.layers.7.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3572577598970383e-05, "sensitivity": 0.9633124593086229 }, { "name": "model.layers.7.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.097706659602409e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006082457257434726, "sensitivity": 0.5193063007857501 }, { "name": "model.layers.7.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006285907002165914, "sensitivity": 0.5633618944599837 }, { "name": "model.layers.7.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.27945212272607e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000658623524941504, "sensitivity": 0.5184510081125105 }, { "name": "model.layers.7.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.320418858900666e-05, "sensitivity": 0.7741428341314598 }, { "name": "model.layers.7.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.202477038641518e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006198523915372789, "sensitivity": 0.5227557037997002 }, { "name": "model.layers.7.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006607719697058201, "sensitivity": 0.5452936589513004 }, { "name": "model.layers.7.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.224267394827621e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000685474369674921, "sensitivity": 0.5473994170091947 }, { "name": "model.layers.7.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006232651649042964, "sensitivity": 0.5216011769475168 }, { "name": "model.layers.7.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.708109256374883e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006373918149620295, "sensitivity": 0.5332486671927286 }, { "name": "model.layers.7.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006178590701892972, "sensitivity": 0.5356794477236101 }, { "name": "model.layers.7.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.91638467994926e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006372565403580666, "sensitivity": 0.5110441525481961 }, { "name": "model.layers.7.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006563399801962078, "sensitivity": 0.5305169593599866 }, { "name": "model.layers.7.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.22909453795728e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006735686911270022, "sensitivity": 0.5718369576604401 }, { "name": "model.layers.7.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006305986316874623, "sensitivity": 0.5407849120417311 }, { "name": "model.layers.7.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.784040920138068e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006973372073844075, "sensitivity": 0.536066120320605 }, { "name": "model.layers.7.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.2947936637792736e-05, "sensitivity": 0.7120341009212721 }, { "name": "model.layers.7.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.748214562117937e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006042728200554848, "sensitivity": 0.598791782775763 }, { "name": "model.layers.7.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.00067484425380826, "sensitivity": 0.5215289497863066 }, { "name": "model.layers.7.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.100860900914995e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006893902900628746, "sensitivity": 0.5142864567494745 }, { "name": "model.layers.7.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0694492276525125e-05, "sensitivity": 0.8798884148767407 }, { "name": "model.layers.7.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.28857151241391e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006994563154876232, "sensitivity": 0.5062024609965204 }, { "name": "model.layers.7.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006136137526482344, "sensitivity": 0.5250660870440428 }, { "name": "model.layers.7.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.944368695054436e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006413794471882284, "sensitivity": 0.532511765117314 }, { "name": "model.layers.7.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006245156982913613, "sensitivity": 0.5549763933628472 }, { "name": "model.layers.7.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.02846114361455e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006381713901646435, "sensitivity": 0.5765319853734985 }, { "name": "model.layers.7.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006523056654259562, "sensitivity": 0.5394926827956099 }, { "name": "model.layers.7.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.022107186254289e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006677209166809916, "sensitivity": 0.5081719791904447 }, { "name": "model.layers.7.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.2672676247311756e-05, "sensitivity": 0.7023803996417274 }, { "name": "model.layers.7.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.966178378002951e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000613968470133841, "sensitivity": 0.509538924474834 }, { "name": "model.layers.7.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9514917666092515e-05, "sensitivity": 0.9466116829131508 }, { "name": "model.layers.7.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.922008424226078e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.293143087532371e-05, "sensitivity": 0.9357820668990922 }, { "name": "model.layers.7.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4547588661080226e-05, "sensitivity": 0.6810597278357804 }, { "name": "model.layers.7.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.753337291025673e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006251310696825385, "sensitivity": 0.5427773139220692 }, { "name": "model.layers.7.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006676516495645046, "sensitivity": 0.5097786040760139 }, { "name": "model.layers.7.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.105659622335224e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006871768273413181, "sensitivity": 0.5393581981447233 }, { "name": "model.layers.7.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006878719432279468, "sensitivity": 0.5412768239939789 }, { "name": "model.layers.7.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.376246233230631e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007092603482306004, "sensitivity": 0.5460815960660529 }, { "name": "model.layers.7.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006594952428713441, "sensitivity": 0.5409136938806953 }, { "name": "model.layers.7.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.183691994010587e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006779811228625476, "sensitivity": 0.5394284544783012 }, { "name": "model.layers.7.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006077652797102928, "sensitivity": 0.5681887768135615 }, { "name": "model.layers.7.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.937930609434261e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006304677808657289, "sensitivity": 0.5626774963479028 }, { "name": "model.layers.7.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000583465036470443, "sensitivity": 0.5310164411986447 }, { "name": "model.layers.7.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.941923291175044e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005987006006762385, "sensitivity": 0.5157500709252083 }, { "name": "model.layers.7.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006480964366346598, "sensitivity": 0.5532745676280008 }, { "name": "model.layers.7.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.923961907683406e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006657079793512821, "sensitivity": 0.5043441267885894 }, { "name": "model.layers.7.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0005948141915723681, "sensitivity": 0.5343164205993178 }, { "name": "model.layers.7.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.224989874681341e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006149043329060078, "sensitivity": 0.5055429558804372 }, { "name": "model.layers.7.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006247260607779026, "sensitivity": 0.5251525898222954 }, { "name": "model.layers.7.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.080761636440002e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006448737112805247, "sensitivity": 0.5026840189912501 }, { "name": "model.layers.7.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000691444322001189, "sensitivity": 0.5196842547104007 }, { "name": "model.layers.7.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.321248520180234e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007137682987377048, "sensitivity": 0.5210010515283658 }, { "name": "model.layers.7.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.530188718694262e-05, "sensitivity": 0.9902766845988619 }, { "name": "model.layers.7.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.122626245996798e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.0459024451847654e-05, "sensitivity": 1.3938075003891899 }, { "name": "model.layers.7.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.262839113129303e-05, "sensitivity": 0.8447448845819387 }, { "name": "model.layers.7.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.046453672250209e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7180150179192424e-05, "sensitivity": 0.6123032511132258 }, { "name": "model.layers.7.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.180983397527598e-06, "sensitivity": 1.6384968360111527 }, { "name": "model.layers.7.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.981732217856916e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 4.899902705801651e-05, "sensitivity": 0.6367923889416511 }, { "name": "model.layers.7.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0005781640065833926, "sensitivity": 0.5694742991825216 }, { "name": "model.layers.7.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.534957037729328e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006030923686921597, "sensitivity": 0.543575286001677 }, { "name": "model.layers.7.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006182952784001827, "sensitivity": 0.5119318748700965 }, { "name": "model.layers.7.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.175154680931882e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006352817872539163, "sensitivity": 0.5053912596767034 }, { "name": "model.layers.7.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006501011084765196, "sensitivity": 0.5807559347150961 }, { "name": "model.layers.7.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.200350526341936e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006893409881740808, "sensitivity": 0.547014743154823 }, { "name": "model.layers.7.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.223013770068064e-05, "sensitivity": 0.7655969219435699 }, { "name": "model.layers.7.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.577503768312454e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.473549001384526e-05, "sensitivity": 0.7149468640836616 }, { "name": "model.layers.7.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006258563371375203, "sensitivity": 0.5614970477110153 }, { "name": "model.layers.7.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.327466053335229e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006608895491808653, "sensitivity": 0.5059851314193357 }, { "name": "model.layers.7.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 4.9284688429906964e-05, "sensitivity": 0.6242470071276273 }, { "name": "model.layers.7.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.758804491051706e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005810059374198318, "sensitivity": 0.5304641882622053 }, { "name": "model.layers.7.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006409158231690526, "sensitivity": 0.52007242752223 }, { "name": "model.layers.7.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.767709012616251e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006499758455902338, "sensitivity": 0.5470332531456726 }, { "name": "model.layers.7.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006489385850727558, "sensitivity": 0.5341065266454442 }, { "name": "model.layers.7.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.824073241456063e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006563173374161124, "sensitivity": 0.5184510587649622 }, { "name": "model.layers.7.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0005940558621659875, "sensitivity": 0.564641868464315 }, { "name": "model.layers.7.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.878320052943309e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006118664750829339, "sensitivity": 0.516188361481141 }, { "name": "model.layers.7.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.670772952726111e-05, "sensitivity": 0.8239068891397434 }, { "name": "model.layers.7.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.631792868778575e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.916252848692238e-05, "sensitivity": 0.8230172959609515 }, { "name": "model.layers.7.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.515339944395237e-05, "sensitivity": 0.7256142963450841 }, { "name": "model.layers.7.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.010852189319849e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006432951777242124, "sensitivity": 0.5719986801814403 }, { "name": "model.layers.7.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.807237175758928e-05, "sensitivity": 0.9559897274926421 }, { "name": "model.layers.7.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.611430194425338e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.170984852360561e-05, "sensitivity": 0.6882206994915674 }, { "name": "model.layers.7.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006209976854734123, "sensitivity": 0.5993704581952555 }, { "name": "model.layers.7.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.899096322536934e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006341019761748612, "sensitivity": 0.5154432044515128 }, { "name": "model.layers.7.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.334527668310329e-05, "sensitivity": 0.9363057021416219 }, { "name": "model.layers.7.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.149631417429191e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006283801048994064, "sensitivity": 0.5856551437308297 }, { "name": "model.layers.7.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006587802199646831, "sensitivity": 0.5210429953967187 }, { "name": "model.layers.7.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.843808139616158e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006650366703979671, "sensitivity": 0.5137982146963058 }, { "name": "model.layers.7.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.1963605073979124e-05, "sensitivity": 0.7718800756993212 }, { "name": "model.layers.7.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.133323608992214e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006031547673046589, "sensitivity": 0.5286565722351834 }, { "name": "model.layers.7.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006020166911184788, "sensitivity": 0.533673197915718 }, { "name": "model.layers.7.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.058327812752395e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006213050801306963, "sensitivity": 0.5524937455667661 }, { "name": "model.layers.7.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0005951565690338612, "sensitivity": 0.5416044331236166 }, { "name": "model.layers.7.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.130318297437043e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006094466662034392, "sensitivity": 0.5632248810922657 }, { "name": "model.layers.7.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006791501073166728, "sensitivity": 0.5309201144935458 }, { "name": "model.layers.7.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.384852895280346e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007062609656713903, "sensitivity": 0.5333888521610165 }, { "name": "model.layers.7.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006312994519248605, "sensitivity": 0.5260884489707879 }, { "name": "model.layers.7.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.266782293096185e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006621097563765943, "sensitivity": 0.532186872122935 }, { "name": "model.layers.7.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.972676783334464e-05, "sensitivity": 0.8137120805645387 }, { "name": "model.layers.7.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.707723739258654e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.391469262074679e-05, "sensitivity": 0.6769786451837005 }, { "name": "model.layers.7.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.745067755924538e-05, "sensitivity": 0.6389059848053901 }, { "name": "model.layers.7.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.976704642307595e-07, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006662673549726605, "sensitivity": 0.5775857846877668 }, { "name": "model.layers.7.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 7.649958206457086e-06, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.6349338238796918e-06, "sensitivity": 2.0986139397860346 }, { "name": "model.layers.7.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5512343907175818e-06, "sensitivity": 10.0 }, { "name": "model.layers.7.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.3129277931511751e-06, "sensitivity": 2.102411012204769 }, { "name": "model.layers.7.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 6.294727882050211e-06, "sensitivity": 2.1673653507053268 }, { "name": "model.layers.7.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00017241756722796708, "sensitivity": 0.9429004640685459 }, { "name": "model.layers.7.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.210101709148148e-05, "sensitivity": 1.681226268566732 }, { "name": "model.layers.7.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.466004222398624e-05, "sensitivity": 0.8648010873352465 }, { "name": "model.layers.7.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002621706807985902, "sensitivity": 0.7031955177702383 }, { "name": "model.layers.8.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.2615861932281405e-05, "sensitivity": 1.0870864895074375 }, { "name": "model.layers.8.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.71673126614769e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006042394088581204, "sensitivity": 0.5354667329338789 }, { "name": "model.layers.8.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8776262449100614e-05, "sensitivity": 1.1208821085470697 }, { "name": "model.layers.8.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.192186674525146e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006728253792971373, "sensitivity": 0.5221069142246312 }, { "name": "model.layers.8.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.698503809981048e-05, "sensitivity": 1.0001111275081294 }, { "name": "model.layers.8.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.974013674858725e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006704336847178638, "sensitivity": 0.537348433212655 }, { "name": "model.layers.8.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5173917644424364e-05, "sensitivity": 1.1093296374998443 }, { "name": "model.layers.8.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.176166493787605e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8998397435061634e-05, "sensitivity": 1.14767346226784 }, { "name": "model.layers.8.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.240125392447226e-05, "sensitivity": 1.0518087570225123 }, { "name": "model.layers.8.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.312615141723654e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006098603480495512, "sensitivity": 0.5841426661691032 }, { "name": "model.layers.8.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.773860539193265e-05, "sensitivity": 1.1803098653343007 }, { "name": "model.layers.8.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.130306928753271e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006631077267229557, "sensitivity": 0.5281308868041266 }, { "name": "model.layers.8.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006219181232154369, "sensitivity": 0.5448575134703897 }, { "name": "model.layers.8.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.065719730941055e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006442638114094734, "sensitivity": 0.5163258204083999 }, { "name": "model.layers.8.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006509541999548674, "sensitivity": 0.5348275117185777 }, { "name": "model.layers.8.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.091271416153177e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006741936085745692, "sensitivity": 0.553265314663232 }, { "name": "model.layers.8.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.2279477889242116e-06, "sensitivity": 2.0936203262295447 }, { "name": "model.layers.8.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.948573971181759e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006497274152934551, "sensitivity": 0.5442129085270528 }, { "name": "model.layers.8.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.729049735236913e-05, "sensitivity": 0.6627473443456809 }, { "name": "model.layers.8.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.427906100725522e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006833620718680322, "sensitivity": 0.5153162217033116 }, { "name": "model.layers.8.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3337029385147616e-05, "sensitivity": 1.1944379680014738 }, { "name": "model.layers.8.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.457540055431309e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000617503363173455, "sensitivity": 0.5215921319261468 }, { "name": "model.layers.8.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006874331156723201, "sensitivity": 0.547134638676166 }, { "name": "model.layers.8.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.31044827059668e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007019065087661147, "sensitivity": 0.5407603430707841 }, { "name": "model.layers.8.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007055179448798299, "sensitivity": 0.509056930905724 }, { "name": "model.layers.8.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.370489700202597e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007130267913453281, "sensitivity": 0.5299646684344438 }, { "name": "model.layers.8.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.760023486800492e-05, "sensitivity": 0.7655253291219766 }, { "name": "model.layers.8.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.333998499030713e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006734055350534618, "sensitivity": 0.5313576787216745 }, { "name": "model.layers.8.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.859709199285135e-05, "sensitivity": 0.6564524297873104 }, { "name": "model.layers.8.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.192334467414184e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006772982887923717, "sensitivity": 0.5499775389976215 }, { "name": "model.layers.8.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.165255035739392e-05, "sensitivity": 0.6146048110680012 }, { "name": "model.layers.8.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.317042107184534e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007042891811579466, "sensitivity": 0.5256339487359742 }, { "name": "model.layers.8.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4848482250235975e-05, "sensitivity": 0.8404102707559693 }, { "name": "model.layers.8.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.936523734817456e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006279231747612357, "sensitivity": 0.5531278251441654 }, { "name": "model.layers.8.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006110720569267869, "sensitivity": 0.552693974372499 }, { "name": "model.layers.8.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.758219003837439e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006288491422310472, "sensitivity": 0.5307159805522311 }, { "name": "model.layers.8.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.245471119356807e-06, "sensitivity": 1.6728180954190464 }, { "name": "model.layers.8.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.183159714761132e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005736150778830051, "sensitivity": 0.5123850143719645 }, { "name": "model.layers.8.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4242682381300256e-05, "sensitivity": 0.7190858800906638 }, { "name": "model.layers.8.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.312208711278799e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000634278345387429, "sensitivity": 0.5346459488169297 }, { "name": "model.layers.8.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.162719753570855e-05, "sensitivity": 0.8321288206884722 }, { "name": "model.layers.8.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.777491765002196e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006078301230445504, "sensitivity": 0.5107739932094367 }, { "name": "model.layers.8.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.4775441539241e-06, "sensitivity": 1.2515247870830233 }, { "name": "model.layers.8.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.796049435957684e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005979108391329646, "sensitivity": 0.5518671864699555 }, { "name": "model.layers.8.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.914230132475495e-05, "sensitivity": 0.6897979349771116 }, { "name": "model.layers.8.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.262265515033505e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006954871350899339, "sensitivity": 0.5276448124586104 }, { "name": "model.layers.8.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0355888662161306e-05, "sensitivity": 1.573219285400514 }, { "name": "model.layers.8.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.686907679271826e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.097659934312105e-05, "sensitivity": 0.8977643342601819 }, { "name": "model.layers.8.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.843246981385164e-05, "sensitivity": 0.7647439647580461 }, { "name": "model.layers.8.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.194605361997674e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006755664362572134, "sensitivity": 0.5012576828982775 }, { "name": "model.layers.8.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006658685160800815, "sensitivity": 0.5599304851481322 }, { "name": "model.layers.8.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.972873395876377e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006737681105732918, "sensitivity": 0.5411090158500438 }, { "name": "model.layers.8.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.498531390912831e-05, "sensitivity": 0.727280634469451 }, { "name": "model.layers.8.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.195393211783085e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006391379865817726, "sensitivity": 0.5202342725427327 }, { "name": "model.layers.8.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0801223652379122e-05, "sensitivity": 1.6465826212871875 }, { "name": "model.layers.8.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.28692987447721e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006823057774454355, "sensitivity": 0.5502517326140575 }, { "name": "model.layers.8.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.072902422398329e-05, "sensitivity": 0.7868710018713755 }, { "name": "model.layers.8.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.603196993637539e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.318496187101118e-05, "sensitivity": 0.831806749699856 }, { "name": "model.layers.8.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9270067140460014e-05, "sensitivity": 0.9470221606314492 }, { "name": "model.layers.8.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.432395250361878e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.219906936166808e-05, "sensitivity": 0.8204530712264315 }, { "name": "model.layers.8.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006307018920779228, "sensitivity": 0.5663031113229271 }, { "name": "model.layers.8.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.742139705944282e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006404279265552759, "sensitivity": 0.5307843520907931 }, { "name": "model.layers.8.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.58365645701997e-05, "sensitivity": 1.1183224216942202 }, { "name": "model.layers.8.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.070342806197004e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.798276833957061e-05, "sensitivity": 0.8440855514090759 }, { "name": "model.layers.8.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0085102985613048e-05, "sensitivity": 1.2701799638893685 }, { "name": "model.layers.8.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.140813522710232e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7542521972209215e-05, "sensitivity": 0.7488112866076663 }, { "name": "model.layers.8.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006910294177941978, "sensitivity": 0.559079180395661 }, { "name": "model.layers.8.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.15346266386041e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006978041492402554, "sensitivity": 0.5307955675491723 }, { "name": "model.layers.8.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.559723649639636e-05, "sensitivity": 1.0546937672746093 }, { "name": "model.layers.8.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.614859557885211e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.779845378128812e-05, "sensitivity": 0.89047466188325 }, { "name": "model.layers.8.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.977266118861735e-05, "sensitivity": 1.0050705665239508 }, { "name": "model.layers.8.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.437505248868547e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006848713383078575, "sensitivity": 0.5740453052245409 }, { "name": "model.layers.8.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.326051905285567e-05, "sensitivity": 0.7484268151532476 }, { "name": "model.layers.8.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.179761840030551e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006288717268034816, "sensitivity": 0.5527154260571621 }, { "name": "model.layers.8.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8454064856050536e-05, "sensitivity": 0.7150786705779367 }, { "name": "model.layers.8.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.407811952158227e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000684408179949969, "sensitivity": 0.5188308214639701 }, { "name": "model.layers.8.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.666171637130901e-05, "sensitivity": 0.8822320043884101 }, { "name": "model.layers.8.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.788373869108909e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006405941094271839, "sensitivity": 0.5391685193444248 }, { "name": "model.layers.8.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006878252024762332, "sensitivity": 0.5173512870683591 }, { "name": "model.layers.8.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.281061928348208e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000707612547557801, "sensitivity": 0.5104118713880513 }, { "name": "model.layers.8.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000649136258289218, "sensitivity": 0.5583637286815685 }, { "name": "model.layers.8.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.365065701174899e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006790678016841412, "sensitivity": 0.5398701870808521 }, { "name": "model.layers.8.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9970432630507275e-05, "sensitivity": 0.9824354208034521 }, { "name": "model.layers.8.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.219751753633318e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006898745778016746, "sensitivity": 0.5412851817838814 }, { "name": "model.layers.8.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6241173297166824e-05, "sensitivity": 0.7749969915339826 }, { "name": "model.layers.8.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.167048240968143e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006554393912665546, "sensitivity": 0.5367211935859852 }, { "name": "model.layers.8.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006598454201593995, "sensitivity": 0.5767583721453159 }, { "name": "model.layers.8.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.24120730208233e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006748183513991535, "sensitivity": 0.5080155172363683 }, { "name": "model.layers.8.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.905385478399694e-05, "sensitivity": 0.665856271178344 }, { "name": "model.layers.8.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.957725761618349e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006658464553765953, "sensitivity": 0.5192218125290777 }, { "name": "model.layers.8.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.040451262379065e-05, "sensitivity": 0.6523308956975519 }, { "name": "model.layers.8.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.145505722088274e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006948718801140785, "sensitivity": 0.5360621632377598 }, { "name": "model.layers.8.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.825726839248091e-05, "sensitivity": 0.6912991033709895 }, { "name": "model.layers.8.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.398983600774955e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006741941324435174, "sensitivity": 0.539443096116127 }, { "name": "model.layers.8.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.959940608590841e-05, "sensitivity": 0.7522959247385123 }, { "name": "model.layers.8.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.98943188379053e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006651740404777229, "sensitivity": 0.5473037128540261 }, { "name": "model.layers.8.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.221517105586827e-05, "sensitivity": 0.724214950955535 }, { "name": "model.layers.8.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.525741582663613e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007223885040730238, "sensitivity": 0.5175606066423489 }, { "name": "model.layers.8.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7800934882834554e-05, "sensitivity": 0.6747299438475869 }, { "name": "model.layers.8.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.372994221237605e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006738868542015553, "sensitivity": 0.5933618750715148 }, { "name": "model.layers.8.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3238123655319214e-05, "sensitivity": 0.9228794044449415 }, { "name": "model.layers.8.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.044552947059856e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006113721756264567, "sensitivity": 0.5482854844516507 }, { "name": "model.layers.8.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5096112191677094e-05, "sensitivity": 0.700575386381613 }, { "name": "model.layers.8.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.176052238515695e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006509938393719494, "sensitivity": 0.5001505586290487 }, { "name": "model.layers.8.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0683223081286997e-05, "sensitivity": 1.3304451987384829 }, { "name": "model.layers.8.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.227409130588057e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006682439125142992, "sensitivity": 0.5624404181209963 }, { "name": "model.layers.8.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.847525244462304e-05, "sensitivity": 1.0719372323265646 }, { "name": "model.layers.8.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.076325576032104e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006915838457643986, "sensitivity": 0.5337965375288557 }, { "name": "model.layers.8.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8641715440899134e-05, "sensitivity": 1.0080218464167219 }, { "name": "model.layers.8.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.538168915743881e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.243996904231608e-05, "sensitivity": 0.6987809043628073 }, { "name": "model.layers.8.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0298905181116425e-05, "sensitivity": 1.2494091619061605 }, { "name": "model.layers.8.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.099608640397491e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6786928325891495e-05, "sensitivity": 0.8416143552074654 }, { "name": "model.layers.8.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.216136923991144e-05, "sensitivity": 1.129060987784554 }, { "name": "model.layers.8.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.794286153104622e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006110165268182755, "sensitivity": 0.5246742407732686 }, { "name": "model.layers.8.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.284371193032712e-05, "sensitivity": 0.6055920122782452 }, { "name": "model.layers.8.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.036767328827409e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007521145744249225, "sensitivity": 0.5364995650687856 }, { "name": "model.layers.8.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.813846190809272e-06, "sensitivity": 1.457729745170581 }, { "name": "model.layers.8.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.755064194090664e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006191876600496471, "sensitivity": 0.5189783919067208 }, { "name": "model.layers.8.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.909351319947746e-06, "sensitivity": 1.2338806769986068 }, { "name": "model.layers.8.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.788973567177891e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006186409736983478, "sensitivity": 0.5417981469866897 }, { "name": "model.layers.8.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.886091821594164e-05, "sensitivity": 0.8216119413689545 }, { "name": "model.layers.8.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.148775580390065e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000699042109772563, "sensitivity": 0.5630105440949598 }, { "name": "model.layers.8.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.478312596096657e-05, "sensitivity": 0.7738089896257592 }, { "name": "model.layers.8.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.509608283522539e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006335486541502178, "sensitivity": 0.5344884353592708 }, { "name": "model.layers.8.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006579881301149726, "sensitivity": 0.5651262904664438 }, { "name": "model.layers.8.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.255388029785536e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006850508507341146, "sensitivity": 0.4983450460040795 }, { "name": "model.layers.8.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.771047653979622e-05, "sensitivity": 0.707014603468375 }, { "name": "model.layers.8.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.274342467804672e-07, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00067514757392928, "sensitivity": 0.5853513044069409 }, { "name": "model.layers.8.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 7.128865490813041e-06, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.9909907678083982e-06, "sensitivity": 2.0992466545881228 }, { "name": "model.layers.8.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.088238832380739e-06, "sensitivity": 10.0 }, { "name": "model.layers.8.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.2747664186463226e-06, "sensitivity": 2.103351951268362 }, { "name": "model.layers.8.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 5.40961445949506e-06, "sensitivity": 2.1476848864125913 }, { "name": "model.layers.8.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00016921942005865276, "sensitivity": 1.1521923221834178 }, { "name": "model.layers.8.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 5, "mse": 3.2878731417440576e-06, "sensitivity": 2.000065486914284 }, { "name": "model.layers.8.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 3.61978163709864e-05, "sensitivity": 0.6878365858430043 }, { "name": "model.layers.8.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 4, "mse": 5.29955759702716e-05, "sensitivity": 1.2480728559870202 }, { "name": "model.layers.9.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006718370132148266, "sensitivity": 0.5974981442462561 }, { "name": "model.layers.9.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.780824151064735e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007002022466622293, "sensitivity": 0.5281827566171818 }, { "name": "model.layers.9.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.816221528220922e-05, "sensitivity": 0.7601869078307271 }, { "name": "model.layers.9.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.991096827528963e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006589662516489625, "sensitivity": 0.499096140686669 }, { "name": "model.layers.9.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0736645536962897e-05, "sensitivity": 0.7739035022086147 }, { "name": "model.layers.9.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.385912456607912e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006955966237001121, "sensitivity": 0.5225135115829536 }, { "name": "model.layers.9.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5396863899659365e-05, "sensitivity": 0.6349225692132343 }, { "name": "model.layers.9.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.902896873521968e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006477205315604806, "sensitivity": 0.5493347837636049 }, { "name": "model.layers.9.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000625104526989162, "sensitivity": 0.5156217196632166 }, { "name": "model.layers.9.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.997364951326745e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000633592251688242, "sensitivity": 0.5147526078118756 }, { "name": "model.layers.9.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006583509966731071, "sensitivity": 0.5401188815949858 }, { "name": "model.layers.9.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.32187493465608e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000667195999994874, "sensitivity": 0.5483101137017716 }, { "name": "model.layers.9.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.472133489092812e-05, "sensitivity": 0.7656930838232505 }, { "name": "model.layers.9.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.747360205532459e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006091412506066263, "sensitivity": 0.5245120710668897 }, { "name": "model.layers.9.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006541299517266452, "sensitivity": 0.543969560658333 }, { "name": "model.layers.9.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.945041152699559e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006554305437020957, "sensitivity": 0.510493402187641 }, { "name": "model.layers.9.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0735583247151226e-05, "sensitivity": 0.812920110599862 }, { "name": "model.layers.9.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.248469842124905e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007019077311269939, "sensitivity": 0.5184826878285639 }, { "name": "model.layers.9.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.45048130536452e-05, "sensitivity": 0.777808666053188 }, { "name": "model.layers.9.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.927607500983868e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.561432383023202e-05, "sensitivity": 0.625946443004278 }, { "name": "model.layers.9.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.737854735343717e-05, "sensitivity": 1.0055944339674798 }, { "name": "model.layers.9.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.035924116076785e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006520358147099614, "sensitivity": 0.5394258112258008 }, { "name": "model.layers.9.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.815062831970863e-05, "sensitivity": 0.7639784608296054 }, { "name": "model.layers.9.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.213836059032474e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006421709549613297, "sensitivity": 0.5363253830341523 }, { "name": "model.layers.9.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 4.933826858177781e-05, "sensitivity": 1.1897185294931552 }, { "name": "model.layers.9.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.20947651239112e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005555971874855459, "sensitivity": 0.5312537666110428 }, { "name": "model.layers.9.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.498290920513682e-05, "sensitivity": 0.8193481454629192 }, { "name": "model.layers.9.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.786170618193864e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006118487799540162, "sensitivity": 0.5405327490428831 }, { "name": "model.layers.9.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 4.735418769996613e-05, "sensitivity": 1.1345636038083384 }, { "name": "model.layers.9.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.159403144716634e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 4.857263411395252e-05, "sensitivity": 0.6716076076525119 }, { "name": "model.layers.9.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.758404950029217e-05, "sensitivity": 0.6642522631264085 }, { "name": "model.layers.9.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.724800982738088e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006464474718086421, "sensitivity": 0.5102632889321557 }, { "name": "model.layers.9.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006569531979039311, "sensitivity": 0.5450408697676192 }, { "name": "model.layers.9.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.108036814111983e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006626536487601697, "sensitivity": 0.5272941325335221 }, { "name": "model.layers.9.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006700510857626796, "sensitivity": 0.5370812749656019 }, { "name": "model.layers.9.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.857401106368343e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006672595627605915, "sensitivity": 0.5508096439260771 }, { "name": "model.layers.9.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006799123948439956, "sensitivity": 0.5237648296316144 }, { "name": "model.layers.9.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.489742077064875e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006957825971767306, "sensitivity": 0.5163109781645167 }, { "name": "model.layers.9.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006354896468110383, "sensitivity": 0.5600641966688469 }, { "name": "model.layers.9.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.825729658681666e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006412089569494128, "sensitivity": 0.5377155656907076 }, { "name": "model.layers.9.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006639836356043816, "sensitivity": 0.5385051073340629 }, { "name": "model.layers.9.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.62295406073099e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006761080003343523, "sensitivity": 0.5982812623247226 }, { "name": "model.layers.9.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006710347952321172, "sensitivity": 0.5728549837555827 }, { "name": "model.layers.9.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.072683618185692e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006706896238029003, "sensitivity": 0.5171149340226308 }, { "name": "model.layers.9.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5865726608317345e-05, "sensitivity": 0.7072570216286294 }, { "name": "model.layers.9.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.863196292921202e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006323631387203932, "sensitivity": 0.5797507117229485 }, { "name": "model.layers.9.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006678564241155982, "sensitivity": 0.5271455393129687 }, { "name": "model.layers.9.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.085470545258431e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006675521726720035, "sensitivity": 0.5303883057855083 }, { "name": "model.layers.9.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6991899327840656e-05, "sensitivity": 0.7601300056525367 }, { "name": "model.layers.9.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.031857537891483e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000633547839242965, "sensitivity": 0.516982962070228 }, { "name": "model.layers.9.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007340325973927975, "sensitivity": 0.5340304243476248 }, { "name": "model.layers.9.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.962081897654571e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007695964886806905, "sensitivity": 0.5078994421381209 }, { "name": "model.layers.9.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006550386315211654, "sensitivity": 0.5377154142950005 }, { "name": "model.layers.9.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.90579134041036e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006528531666845083, "sensitivity": 0.5348849826268476 }, { "name": "model.layers.9.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.609393701888621e-05, "sensitivity": 0.8753976464267876 }, { "name": "model.layers.9.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.9379186723163e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006335391663014889, "sensitivity": 0.5351213469846751 }, { "name": "model.layers.9.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 2.1756079149781726e-05, "sensitivity": 0.7833321942620575 }, { "name": "model.layers.9.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3853144764652825e-06, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.547999070491642e-05, "sensitivity": 1.164623300766112 }, { "name": "model.layers.9.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006561711197718978, "sensitivity": 0.5272391993808697 }, { "name": "model.layers.9.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.782071070825623e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006604896625503898, "sensitivity": 0.5111338067878537 }, { "name": "model.layers.9.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.315493035595864e-05, "sensitivity": 1.0839796478668062 }, { "name": "model.layers.9.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.819899110472761e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.337941911420785e-05, "sensitivity": 1.1770380792568778 }, { "name": "model.layers.9.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006664553075097501, "sensitivity": 0.5148726810422262 }, { "name": "model.layers.9.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.161633336887462e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006714666960760951, "sensitivity": 0.5216714025316695 }, { "name": "model.layers.9.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006479392177425325, "sensitivity": 0.537111416048353 }, { "name": "model.layers.9.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.897651931263681e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006447885534726083, "sensitivity": 0.5256907768048952 }, { "name": "model.layers.9.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006379467085935175, "sensitivity": 0.5606197894323284 }, { "name": "model.layers.9.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.898794483982783e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006464140024036169, "sensitivity": 0.5160448963100829 }, { "name": "model.layers.9.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.646627687383443e-05, "sensitivity": 0.6637862779981396 }, { "name": "model.layers.9.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.753242930950364e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006488097715191543, "sensitivity": 0.5461852006546448 }, { "name": "model.layers.9.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006542066112160683, "sensitivity": 0.5028268773492732 }, { "name": "model.layers.9.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.983508799545234e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006546530639752746, "sensitivity": 0.5581315928798517 }, { "name": "model.layers.9.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006636198377236724, "sensitivity": 0.5288522595631724 }, { "name": "model.layers.9.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.312394589258474e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006760554388165474, "sensitivity": 0.5178451099215056 }, { "name": "model.layers.9.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.771277938038111e-05, "sensitivity": 0.6898596164861763 }, { "name": "model.layers.9.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.965943614683056e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.920344119658694e-05, "sensitivity": 0.6533553946745849 }, { "name": "model.layers.9.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.702349517378025e-05, "sensitivity": 0.6052258298862636 }, { "name": "model.layers.9.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.109018724804628e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8049423387274146e-05, "sensitivity": 0.9419921651697312 }, { "name": "model.layers.9.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006789787439629436, "sensitivity": 0.5596831470364378 }, { "name": "model.layers.9.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.626685262745013e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006933552213013172, "sensitivity": 0.5106485043591351 }, { "name": "model.layers.9.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006471562664955854, "sensitivity": 0.5271988432308534 }, { "name": "model.layers.9.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.836033665218565e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006467056809924543, "sensitivity": 0.5388931905143126 }, { "name": "model.layers.9.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.2778708525002e-05, "sensitivity": 0.6412159793331497 }, { "name": "model.layers.9.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.471129836427281e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007179678650572896, "sensitivity": 0.5418410978722 }, { "name": "model.layers.9.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006732097244821489, "sensitivity": 0.5330232195046056 }, { "name": "model.layers.9.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.288195208981051e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006925577181391418, "sensitivity": 0.5684843701598621 }, { "name": "model.layers.9.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006922517786733806, "sensitivity": 0.5101539018407268 }, { "name": "model.layers.9.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.402889312084881e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007053522276692092, "sensitivity": 0.5321877842075657 }, { "name": "model.layers.9.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.682798655470833e-05, "sensitivity": 0.8269258308350649 }, { "name": "model.layers.9.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.737448868283536e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.802429950563237e-05, "sensitivity": 1.0409294934526672 }, { "name": "model.layers.9.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006695526535622776, "sensitivity": 0.5547868347230887 }, { "name": "model.layers.9.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.325420827124617e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006943633197806776, "sensitivity": 0.5317543840998671 }, { "name": "model.layers.9.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006354432553052902, "sensitivity": 0.5467838656682416 }, { "name": "model.layers.9.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.151075808702444e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006448048516176641, "sensitivity": 0.5313684322241787 }, { "name": "model.layers.9.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006414763629436493, "sensitivity": 0.5388303555934773 }, { "name": "model.layers.9.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.005046770951594e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006460507865995169, "sensitivity": 0.5621515408507196 }, { "name": "model.layers.9.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7949666370404884e-05, "sensitivity": 0.7544313210468162 }, { "name": "model.layers.9.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.707196919502167e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006404236773960292, "sensitivity": 0.5420474606013896 }, { "name": "model.layers.9.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5711978347972035e-05, "sensitivity": 0.6038881845328038 }, { "name": "model.layers.9.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.876138402527431e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006185109377838671, "sensitivity": 0.532222388737757 }, { "name": "model.layers.9.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.69464718864765e-05, "sensitivity": 0.8191484681077827 }, { "name": "model.layers.9.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.550317491222813e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006967487279325724, "sensitivity": 0.5135653990615187 }, { "name": "model.layers.9.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006351706106215715, "sensitivity": 0.5818689608162618 }, { "name": "model.layers.9.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.814083010591276e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006293735932558775, "sensitivity": 0.5236818998698629 }, { "name": "model.layers.9.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9531441365834326e-05, "sensitivity": 0.7657038237963819 }, { "name": "model.layers.9.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.322194394670078e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006659358623437583, "sensitivity": 0.5706050703236533 }, { "name": "model.layers.9.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.887925362912938e-05, "sensitivity": 0.6436733083256816 }, { "name": "model.layers.9.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.167985020510969e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006619318737648427, "sensitivity": 0.5290108594967304 }, { "name": "model.layers.9.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000656602845992893, "sensitivity": 0.514097078460974 }, { "name": "model.layers.9.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.080371122152428e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006620692438445985, "sensitivity": 0.568789201208717 }, { "name": "model.layers.9.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006903898320160806, "sensitivity": 0.5320747061318578 }, { "name": "model.layers.9.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.109157766331919e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000696411938406527, "sensitivity": 0.5325078106600659 }, { "name": "model.layers.9.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006191586144268513, "sensitivity": 0.5337677012401997 }, { "name": "model.layers.9.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.873704367331811e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006208175327628851, "sensitivity": 0.5340733676269468 }, { "name": "model.layers.9.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.85506422794424e-05, "sensitivity": 1.194714820506499 }, { "name": "model.layers.9.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.117923021520255e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9208097809460014e-05, "sensitivity": 0.8647505672822122 }, { "name": "model.layers.9.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006238574278540909, "sensitivity": 0.5909321231899699 }, { "name": "model.layers.9.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.871881967323134e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006281984969973564, "sensitivity": 0.5243314329131529 }, { "name": "model.layers.9.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006588418036699295, "sensitivity": 0.5324520713097508 }, { "name": "model.layers.9.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.034725856807199e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006730224704369903, "sensitivity": 0.5007686089559134 }, { "name": "model.layers.9.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006276955245994031, "sensitivity": 0.5845460142024931 }, { "name": "model.layers.9.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.710224399990693e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006280700908973813, "sensitivity": 0.5702853254599627 }, { "name": "model.layers.9.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000672514084726572, "sensitivity": 0.5749996773039407 }, { "name": "model.layers.9.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.177214686431398e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000683644087985158, "sensitivity": 0.5450299781845642 }, { "name": "model.layers.9.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.681595575879328e-05, "sensitivity": 0.698562847652964 }, { "name": "model.layers.9.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.900087671761867e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006465903716161847, "sensitivity": 0.5772235276835196 }, { "name": "model.layers.9.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006058806902728975, "sensitivity": 0.5493285933578267 }, { "name": "model.layers.9.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.173936526465695e-07, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006226762197911739, "sensitivity": 0.5387091224318223 }, { "name": "model.layers.9.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 6.44470537736197e-06, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.7904869764606701e-06, "sensitivity": 2.098691765052987 }, { "name": "model.layers.9.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4080691244089394e-06, "sensitivity": 10.0 }, { "name": "model.layers.9.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.2826337751903338e-06, "sensitivity": 2.1041024894049896 }, { "name": "model.layers.9.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 8.414354851993266e-06, "sensitivity": 2.160577951362663 }, { "name": "model.layers.9.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.0002055278018815443, "sensitivity": 0.9758394399955677 }, { "name": "model.layers.9.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.1490264114399906e-05, "sensitivity": 1.440454501502106 }, { "name": "model.layers.9.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.602277087746188e-05, "sensitivity": 1.0306058150496469 }, { "name": "model.layers.9.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002935559896286577, "sensitivity": 0.6522346903047324 }, { "name": "model.layers.10.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.778962804470211e-05, "sensitivity": 0.9808496231820867 }, { "name": "model.layers.10.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.064718718334916e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006752474000677466, "sensitivity": 0.5051718119779935 }, { "name": "model.layers.10.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7534467487130314e-05, "sensitivity": 0.9782319225309131 }, { "name": "model.layers.10.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.307191367544874e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006685412372462451, "sensitivity": 0.5393400298205797 }, { "name": "model.layers.10.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.00432395003736e-05, "sensitivity": 0.8452413977093409 }, { "name": "model.layers.10.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.237079333004658e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007047789986245334, "sensitivity": 0.5540104723202642 }, { "name": "model.layers.10.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.144259532447904e-05, "sensitivity": 0.7316004233927859 }, { "name": "model.layers.10.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.603675046790158e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.32608644082211e-05, "sensitivity": 0.6762973472588387 }, { "name": "model.layers.10.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0532969099585898e-05, "sensitivity": 1.505433341184062 }, { "name": "model.layers.10.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.540019169027801e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8956076827598736e-05, "sensitivity": 0.6448369905623841 }, { "name": "model.layers.10.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.128969107521698e-05, "sensitivity": 0.7594544275436393 }, { "name": "model.layers.10.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.232529585759039e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007039706688374281, "sensitivity": 0.5435394746504489 }, { "name": "model.layers.10.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0184374888194725e-05, "sensitivity": 0.8801975015220301 }, { "name": "model.layers.10.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.127438609837554e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006880480796098709, "sensitivity": 0.5259072770482316 }, { "name": "model.layers.10.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006616414757445455, "sensitivity": 0.5897524633967041 }, { "name": "model.layers.10.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.301182793322369e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006962766638025641, "sensitivity": 0.5461120303176393 }, { "name": "model.layers.10.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.526706809177995e-05, "sensitivity": 0.8790529909840765 }, { "name": "model.layers.10.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.079139893699903e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006438078125938773, "sensitivity": 0.5320622667209733 }, { "name": "model.layers.10.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006738455849699676, "sensitivity": 0.5930142970596674 }, { "name": "model.layers.10.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.359173312375788e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007061576470732689, "sensitivity": 0.5269607773495272 }, { "name": "model.layers.10.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.776726902695373e-05, "sensitivity": 1.1065529440385444 }, { "name": "model.layers.10.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.896816901440616e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006651724688708782, "sensitivity": 0.5327759889330748 }, { "name": "model.layers.10.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.547194086830132e-05, "sensitivity": 1.0924891877453267 }, { "name": "model.layers.10.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.962087357147539e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8915960835292935e-05, "sensitivity": 0.7262918333389989 }, { "name": "model.layers.10.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4679723689332604e-05, "sensitivity": 0.6602954846173905 }, { "name": "model.layers.10.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.463331831379037e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006260558729991317, "sensitivity": 0.5238481079451808 }, { "name": "model.layers.10.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.650188076193444e-06, "sensitivity": 1.6087106127945627 }, { "name": "model.layers.10.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.706790489057312e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.335133755579591e-05, "sensitivity": 0.8387386607626195 }, { "name": "model.layers.10.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006929850205779076, "sensitivity": 0.5436607478452298 }, { "name": "model.layers.10.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.223152126949572e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007114153122529387, "sensitivity": 0.5116419740107498 }, { "name": "model.layers.10.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.842001337441616e-05, "sensitivity": 0.7878559624336845 }, { "name": "model.layers.10.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.935887088526215e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006724897539243102, "sensitivity": 0.5328886575378998 }, { "name": "model.layers.10.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.928682367084548e-05, "sensitivity": 0.6881578893620952 }, { "name": "model.layers.10.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.441488835662312e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007042217766866088, "sensitivity": 0.5158498920603503 }, { "name": "model.layers.10.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006556875305250287, "sensitivity": 0.5920130227006183 }, { "name": "model.layers.10.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.266907917051867e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006873593665659428, "sensitivity": 0.5453190553901024 }, { "name": "model.layers.10.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.944468648522161e-05, "sensitivity": 0.7058197019870776 }, { "name": "model.layers.10.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.172757593958522e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006910410593263805, "sensitivity": 0.5080285266049768 }, { "name": "model.layers.10.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.84337748377584e-06, "sensitivity": 1.2389759961560076 }, { "name": "model.layers.10.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.779098728453391e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006188277620822191, "sensitivity": 0.5065140885537013 }, { "name": "model.layers.10.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.701010741177015e-05, "sensitivity": 0.9420418282648158 }, { "name": "model.layers.10.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.981967206025729e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006688495050184429, "sensitivity": 0.5252855386414306 }, { "name": "model.layers.10.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.243365351110697e-05, "sensitivity": 0.6244959770091504 }, { "name": "model.layers.10.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.499245728264214e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007275642128661275, "sensitivity": 0.530632388011969 }, { "name": "model.layers.10.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.533221337827854e-05, "sensitivity": 1.1751690669302712 }, { "name": "model.layers.10.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.763337185271666e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006303695845417678, "sensitivity": 0.5563235283281187 }, { "name": "model.layers.10.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.940699338680133e-05, "sensitivity": 0.6944992359452228 }, { "name": "model.layers.10.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.463130262090999e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000705813872627914, "sensitivity": 0.5336359173587198 }, { "name": "model.layers.10.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1231291864532977e-05, "sensitivity": 1.554162935144629 }, { "name": "model.layers.10.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.213085725903511e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.047237548045814e-05, "sensitivity": 0.8435829573102192 }, { "name": "model.layers.10.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7614772231318057e-05, "sensitivity": 1.087269912938866 }, { "name": "model.layers.10.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.116522399679525e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006687987479381263, "sensitivity": 0.57025976039468 }, { "name": "model.layers.10.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.615534610114992e-05, "sensitivity": 0.9512175329683256 }, { "name": "model.layers.10.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.822868160976213e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006573497084900737, "sensitivity": 0.5171680850125782 }, { "name": "model.layers.10.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7809764257399365e-05, "sensitivity": 0.8638499247696438 }, { "name": "model.layers.10.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.2734079619986e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006624504458159208, "sensitivity": 0.5434690939074788 }, { "name": "model.layers.10.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.772476288257167e-05, "sensitivity": 0.6827774957342929 }, { "name": "model.layers.10.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.885822247364558e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000660410150885582, "sensitivity": 0.5293121346377567 }, { "name": "model.layers.10.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.087654527509585e-05, "sensitivity": 1.3635356580995002 }, { "name": "model.layers.10.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.922481361471e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000719210715033114, "sensitivity": 0.5751011870033935 }, { "name": "model.layers.10.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0184727216255851e-05, "sensitivity": 1.2260693064775512 }, { "name": "model.layers.10.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.573172868229449e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006366258021444082, "sensitivity": 0.5115146495675152 }, { "name": "model.layers.10.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006698633078485727, "sensitivity": 0.5768079236272605 }, { "name": "model.layers.10.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.309544460236793e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007010637782514095, "sensitivity": 0.5276046151208734 }, { "name": "model.layers.10.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4739241022616625e-05, "sensitivity": 0.9731364141758012 }, { "name": "model.layers.10.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.71595933251956e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006378927500918508, "sensitivity": 0.5398747472891191 }, { "name": "model.layers.10.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.134021532488987e-05, "sensitivity": 0.8709408077345695 }, { "name": "model.layers.10.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.511760375360609e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.34274329058826e-05, "sensitivity": 0.71882371589081 }, { "name": "model.layers.10.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.006375406286679e-05, "sensitivity": 0.6771858240138329 }, { "name": "model.layers.10.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.31224509106687e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006935363635420799, "sensitivity": 0.5604030110397549 }, { "name": "model.layers.10.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.742789289797656e-05, "sensitivity": 1.0052689513331678 }, { "name": "model.layers.10.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.866429546586005e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000650921487249434, "sensitivity": 0.522069850279115 }, { "name": "model.layers.10.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.552671427722089e-05, "sensitivity": 1.158538280144923 }, { "name": "model.layers.10.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.039290951775911e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.762848741142079e-05, "sensitivity": 0.9010368646277446 }, { "name": "model.layers.10.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0471079804119654e-05, "sensitivity": 1.9210646470851043 }, { "name": "model.layers.10.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.425506171581219e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006750381435267627, "sensitivity": 0.5341414053330147 }, { "name": "model.layers.10.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006994003779254854, "sensitivity": 0.5686492270933112 }, { "name": "model.layers.10.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.64010599393805e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000718334224075079, "sensitivity": 0.5367061697071026 }, { "name": "model.layers.10.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.887453880859539e-05, "sensitivity": 0.8362507605393498 }, { "name": "model.layers.10.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.303559985099128e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006775199435651302, "sensitivity": 0.5485535195886381 }, { "name": "model.layers.10.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.144210055936128e-05, "sensitivity": 0.6682585427460439 }, { "name": "model.layers.10.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.125196136963496e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006938920123502612, "sensitivity": 0.5206058271769154 }, { "name": "model.layers.10.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9981677622999996e-05, "sensitivity": 0.6431723086640958 }, { "name": "model.layers.10.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.057729251551791e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006922089378349483, "sensitivity": 0.5582496069687256 }, { "name": "model.layers.10.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6281387514900416e-05, "sensitivity": 0.8003988698776401 }, { "name": "model.layers.10.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.327399546535162e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006650573341175914, "sensitivity": 0.5429115518341779 }, { "name": "model.layers.10.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7886805734597147e-05, "sensitivity": 0.7538841314440521 }, { "name": "model.layers.10.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.039653044354054e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006681226077489555, "sensitivity": 0.5520602870390326 }, { "name": "model.layers.10.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1628125321294647e-05, "sensitivity": 1.5218407304683867 }, { "name": "model.layers.10.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.658849542873213e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007303711026906967, "sensitivity": 0.53915012451045 }, { "name": "model.layers.10.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8796485973289236e-05, "sensitivity": 1.1188212545506375 }, { "name": "model.layers.10.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.890545367037703e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006701587699353695, "sensitivity": 0.5614258398081984 }, { "name": "model.layers.10.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0783942899433896e-05, "sensitivity": 1.1386557250299758 }, { "name": "model.layers.10.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.191226020746399e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.22677180217579e-05, "sensitivity": 0.8639922171816867 }, { "name": "model.layers.10.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0107580793555826e-05, "sensitivity": 0.6279555591419329 }, { "name": "model.layers.10.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.181865614962589e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006940255407243967, "sensitivity": 0.5260646146077993 }, { "name": "model.layers.10.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.915312794968486e-05, "sensitivity": 0.6100909152600885 }, { "name": "model.layers.10.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.114302095738822e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006946211215108633, "sensitivity": 0.5148680858091058 }, { "name": "model.layers.10.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.64923211641144e-05, "sensitivity": 0.7473449466492628 }, { "name": "model.layers.10.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.795059792035318e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006573262508027256, "sensitivity": 0.5162583412914175 }, { "name": "model.layers.10.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.698015957023017e-05, "sensitivity": 0.9999476831875491 }, { "name": "model.layers.10.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.712337838303938e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006531418184749782, "sensitivity": 0.5387711896575971 }, { "name": "model.layers.10.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9089372371090576e-05, "sensitivity": 0.7833055748671565 }, { "name": "model.layers.10.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.964518206586945e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007000688347034156, "sensitivity": 0.5196541942562746 }, { "name": "model.layers.10.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.14955642959103e-05, "sensitivity": 0.6710319048868427 }, { "name": "model.layers.10.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.191843908709416e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007032208959572017, "sensitivity": 0.5080426789267921 }, { "name": "model.layers.10.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0548700275830925e-05, "sensitivity": 0.8251030837695996 }, { "name": "model.layers.10.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.472560016845819e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007117760251276195, "sensitivity": 0.5133899109601321 }, { "name": "model.layers.10.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.771568976342678e-05, "sensitivity": 0.758481966186873 }, { "name": "model.layers.10.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.779335197075852e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006465050973929465, "sensitivity": 0.5183906604730939 }, { "name": "model.layers.10.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007342511671595275, "sensitivity": 0.5209691324399041 }, { "name": "model.layers.10.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.674192150057934e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007591458852402866, "sensitivity": 0.5190607569985405 }, { "name": "model.layers.10.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.461570617626421e-05, "sensitivity": 0.8783931479536159 }, { "name": "model.layers.10.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.73069769416179e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006302502006292343, "sensitivity": 0.5215380516650012 }, { "name": "model.layers.10.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.777849582955241e-05, "sensitivity": 1.0238632714599207 }, { "name": "model.layers.10.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.784729637525743e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006464679609052837, "sensitivity": 0.5561990382867451 }, { "name": "model.layers.10.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.380992661230266e-05, "sensitivity": 0.8100174360649663 }, { "name": "model.layers.10.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.691909450433741e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006254971376620233, "sensitivity": 0.539287262156092 }, { "name": "model.layers.10.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.144361395854503e-05, "sensitivity": 1.1200247679100033 }, { "name": "model.layers.10.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.507192438220955e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007031867280602455, "sensitivity": 0.5315708949210067 }, { "name": "model.layers.10.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.967274046270177e-05, "sensitivity": 0.746719720362562 }, { "name": "model.layers.10.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.204717237778823e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00069528998574242, "sensitivity": 0.56651622729987 }, { "name": "model.layers.10.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.141478661447763e-05, "sensitivity": 0.8648946498828997 }, { "name": "model.layers.10.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.280773732214584e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007168831652961671, "sensitivity": 0.5201995862694142 }, { "name": "model.layers.10.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.281946843955666e-05, "sensitivity": 0.6798635587957006 }, { "name": "model.layers.10.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.243961590575054e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007604529964737594, "sensitivity": 0.5866853242128609 }, { "name": "model.layers.10.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.060205851099454e-05, "sensitivity": 0.6125099777906133 }, { "name": "model.layers.10.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.221889066182484e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007032882422208786, "sensitivity": 0.5248706246353323 }, { "name": "model.layers.10.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 6.57720556773711e-06, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.9092685761279427e-06, "sensitivity": 2.0988195862676102 }, { "name": "model.layers.10.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.782430995779578e-07, "sensitivity": 10.0 }, { "name": "model.layers.10.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.2594293821166502e-06, "sensitivity": 2.1033093244414762 }, { "name": "model.layers.10.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 2.1491863662959076e-05, "sensitivity": 1.7644165736283748 }, { "name": "model.layers.10.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00017753778956830502, "sensitivity": 0.9936385060102264 }, { "name": "model.layers.10.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 5, "mse": 3.0599258025176823e-06, "sensitivity": 2.10302519579803 }, { "name": "model.layers.10.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0004934285534545779, "sensitivity": 0.5894430113653066 }, { "name": "model.layers.10.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00029263197211548686, "sensitivity": 0.902501797067964 }, { "name": "model.layers.11.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0361402574926615e-05, "sensitivity": 0.6023706760633327 }, { "name": "model.layers.11.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.172108442115132e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007052895962260664, "sensitivity": 0.5280479543794034 }, { "name": "model.layers.11.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.796973709948361e-05, "sensitivity": 0.8081416404807281 }, { "name": "model.layers.11.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.234729426068952e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006920655723661184, "sensitivity": 0.5008211818358708 }, { "name": "model.layers.11.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.50604127056431e-05, "sensitivity": 0.6825722054111821 }, { "name": "model.layers.11.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.276766271184897e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.470716132549569e-05, "sensitivity": 0.7387491204557114 }, { "name": "model.layers.11.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8363650168757886e-05, "sensitivity": 0.7906022137508409 }, { "name": "model.layers.11.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.287403948590509e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000694180082064122, "sensitivity": 0.5173936149719223 }, { "name": "model.layers.11.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.77527898713015e-05, "sensitivity": 1.0504680668502608 }, { "name": "model.layers.11.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.632783424720401e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8749705203808844e-05, "sensitivity": 1.1350975070586211 }, { "name": "model.layers.11.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.228358688531443e-05, "sensitivity": 0.618975170927762 }, { "name": "model.layers.11.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.916468464623904e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007170757162384689, "sensitivity": 0.5264530139960808 }, { "name": "model.layers.11.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006860606372356415, "sensitivity": 0.5438726011741133 }, { "name": "model.layers.11.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.266598688853264e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007181983673945069, "sensitivity": 0.5324002202044814 }, { "name": "model.layers.11.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.403661483185715e-06, "sensitivity": 2.097466040063141 }, { "name": "model.layers.11.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.823446933092782e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.427839980460703e-05, "sensitivity": 0.6278238452756947 }, { "name": "model.layers.11.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.762535147368908e-05, "sensitivity": 0.650545012628262 }, { "name": "model.layers.11.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.37450284557417e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006798223475925624, "sensitivity": 0.5165541623544111 }, { "name": "model.layers.11.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006627188413403928, "sensitivity": 0.5904622879878545 }, { "name": "model.layers.11.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.955495794296439e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006831339560449123, "sensitivity": 0.5784976605018954 }, { "name": "model.layers.11.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006859493441879749, "sensitivity": 0.5017361679737629 }, { "name": "model.layers.11.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.405493877537083e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007233502110466361, "sensitivity": 0.55555555551672 }, { "name": "model.layers.11.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.644105112878606e-05, "sensitivity": 0.8787458854404175 }, { "name": "model.layers.11.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.439665180048905e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.937464811722748e-05, "sensitivity": 0.7762796699869896 }, { "name": "model.layers.11.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.886988219572231e-05, "sensitivity": 0.8668026831853006 }, { "name": "model.layers.11.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.19658749201335e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006812134524807334, "sensitivity": 0.5486142293116909 }, { "name": "model.layers.11.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.662973126163706e-05, "sensitivity": 0.9019174061084743 }, { "name": "model.layers.11.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.953352797405387e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006472700042650104, "sensitivity": 0.5643055778385534 }, { "name": "model.layers.11.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7433393521932885e-05, "sensitivity": 0.9361358457705721 }, { "name": "model.layers.11.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.095330829542945e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006540577742271125, "sensitivity": 0.5438391747410771 }, { "name": "model.layers.11.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006754290661774576, "sensitivity": 0.5286697780077116 }, { "name": "model.layers.11.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.571437438651628e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007088728016242385, "sensitivity": 0.5463444711450689 }, { "name": "model.layers.11.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0202095836575609e-05, "sensitivity": 1.4232004278743426 }, { "name": "model.layers.11.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.725365437887376e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.886871804250404e-05, "sensitivity": 0.6875892995738143 }, { "name": "model.layers.11.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006926845526322722, "sensitivity": 0.5800302195806806 }, { "name": "model.layers.11.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.839285333626322e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.422249134629965e-05, "sensitivity": 0.6418741316797166 }, { "name": "model.layers.11.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006565148942172527, "sensitivity": 0.5599577061611214 }, { "name": "model.layers.11.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.270253720686014e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006770341424271464, "sensitivity": 0.5527231137950138 }, { "name": "model.layers.11.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.935416993452236e-05, "sensitivity": 1.022477491420641 }, { "name": "model.layers.11.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.224217372619023e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006962606566958129, "sensitivity": 0.5119732962936744 }, { "name": "model.layers.11.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.591745866695419e-05, "sensitivity": 0.6805142027780415 }, { "name": "model.layers.11.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.949731303189765e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006670517614111304, "sensitivity": 0.5395684475642144 }, { "name": "model.layers.11.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.790618888568133e-05, "sensitivity": 0.6380648442996587 }, { "name": "model.layers.11.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.040619950908876e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006646787514910102, "sensitivity": 0.5860625029012416 }, { "name": "model.layers.11.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007038038456812501, "sensitivity": 0.5551057678722349 }, { "name": "model.layers.11.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.126035370674799e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.692273746011779e-05, "sensitivity": 0.7558305776427597 }, { "name": "model.layers.11.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.390015576267615e-05, "sensitivity": 1.1362201423727611 }, { "name": "model.layers.11.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.538638561120024e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006249562720768154, "sensitivity": 0.5694440592479623 }, { "name": "model.layers.11.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006947522051632404, "sensitivity": 0.5144441311715582 }, { "name": "model.layers.11.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.696482159895822e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007362505421042442, "sensitivity": 0.5251897303512247 }, { "name": "model.layers.11.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006693325703963637, "sensitivity": 0.5108378074312884 }, { "name": "model.layers.11.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.607107252420974e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007056001340970397, "sensitivity": 0.528142451101946 }, { "name": "model.layers.11.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006922582979314029, "sensitivity": 0.579023753489149 }, { "name": "model.layers.11.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.596705475203635e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.536625733133405e-05, "sensitivity": 0.6089873681505772 }, { "name": "model.layers.11.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.17992045590654e-05, "sensitivity": 0.7957411506249544 }, { "name": "model.layers.11.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.373907126544509e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007114330073818564, "sensitivity": 0.5401249016879698 }, { "name": "model.layers.11.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.080843048839597e-05, "sensitivity": 1.425282703934228 }, { "name": "model.layers.11.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.957941423024749e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.979530396871269e-05, "sensitivity": 0.6012036054417664 }, { "name": "model.layers.11.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.944816439296119e-05, "sensitivity": 0.8203063577633689 }, { "name": "model.layers.11.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.228935944818659e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006860228604637086, "sensitivity": 0.5827092079854196 }, { "name": "model.layers.11.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.596108894678764e-05, "sensitivity": 0.6798547915571933 }, { "name": "model.layers.11.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.9319359024812e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.64186557312496e-05, "sensitivity": 0.8254945364652033 }, { "name": "model.layers.11.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.091125396778807e-05, "sensitivity": 0.6321540252624798 }, { "name": "model.layers.11.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.220875548024196e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007153353653848171, "sensitivity": 0.5433718656990403 }, { "name": "model.layers.11.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.748809780925512e-05, "sensitivity": 0.6948426392057012 }, { "name": "model.layers.11.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.984868494124385e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.049437070032582e-05, "sensitivity": 0.6192686923464186 }, { "name": "model.layers.11.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006850312929600477, "sensitivity": 0.5633331029419104 }, { "name": "model.layers.11.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.414306881197263e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000725744990631938, "sensitivity": 0.5369430009841447 }, { "name": "model.layers.11.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006689398433081806, "sensitivity": 0.5337652418166731 }, { "name": "model.layers.11.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.300426207417331e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006982035702094436, "sensitivity": 0.5570071063205955 }, { "name": "model.layers.11.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.682997188065201e-06, "sensitivity": 1.8274658013207374 }, { "name": "model.layers.11.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.3816705758436e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005963838775642216, "sensitivity": 0.549014354845991 }, { "name": "model.layers.11.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.693256025551818e-05, "sensitivity": 0.6572753450867674 }, { "name": "model.layers.11.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.95229380451201e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006504305056296289, "sensitivity": 0.5209342719672923 }, { "name": "model.layers.11.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006721990648657084, "sensitivity": 0.5245708008429625 }, { "name": "model.layers.11.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.28543091352185e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007129220175556839, "sensitivity": 0.5021148290848686 }, { "name": "model.layers.11.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006717243231832981, "sensitivity": 0.540784433525504 }, { "name": "model.layers.11.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.134287673376093e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006887810304760933, "sensitivity": 0.4994425966188444 }, { "name": "model.layers.11.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000666693493258208, "sensitivity": 0.5450596204860867 }, { "name": "model.layers.11.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.160976226965431e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006850412464700639, "sensitivity": 0.5384600800959418 }, { "name": "model.layers.11.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.468774806009606e-06, "sensitivity": 1.9034568831917276 }, { "name": "model.layers.11.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.509797347258427e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.04466297570616e-05, "sensitivity": 0.7891271073961957 }, { "name": "model.layers.11.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.70408564171521e-06, "sensitivity": 1.9133009934411283 }, { "name": "model.layers.11.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.583925144492241e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.559333294513635e-05, "sensitivity": 0.697246217815531 }, { "name": "model.layers.11.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.218800990609452e-05, "sensitivity": 0.9512563526268878 }, { "name": "model.layers.11.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.935513283679029e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007269473280757666, "sensitivity": 0.5544312460110434 }, { "name": "model.layers.11.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.866777428309433e-05, "sensitivity": 0.6818237236290683 }, { "name": "model.layers.11.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.44535703031579e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.051356831449084e-05, "sensitivity": 0.8535566569019615 }, { "name": "model.layers.11.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006603755755349994, "sensitivity": 0.550940301614032 }, { "name": "model.layers.11.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.143900463939644e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000676508410833776, "sensitivity": 0.5489237568247056 }, { "name": "model.layers.11.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.841855899139773e-06, "sensitivity": 1.2971400353428502 }, { "name": "model.layers.11.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.618725253953016e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000631738337688148, "sensitivity": 0.5554754834953265 }, { "name": "model.layers.11.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006738192751072347, "sensitivity": 0.5895826383135829 }, { "name": "model.layers.11.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.205902423062071e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006933609838597476, "sensitivity": 0.5189650738235299 }, { "name": "model.layers.11.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.880012031411752e-05, "sensitivity": 0.709440769729506 }, { "name": "model.layers.11.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.112150003900751e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006759336101822555, "sensitivity": 0.5492671763455518 }, { "name": "model.layers.11.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.119678437244147e-05, "sensitivity": 0.9698874659095851 }, { "name": "model.layers.11.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.392330078597297e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007246757159009576, "sensitivity": 0.5291056580223185 }, { "name": "model.layers.11.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.839896039105952e-05, "sensitivity": 0.9793326648294476 }, { "name": "model.layers.11.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.638394438596151e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006820972776040435, "sensitivity": 0.5195699758374454 }, { "name": "model.layers.11.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.910825711907819e-05, "sensitivity": 0.8155130115022294 }, { "name": "model.layers.11.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.276574708863336e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006781625561416149, "sensitivity": 0.5942577881963579 }, { "name": "model.layers.11.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0248892067465931e-05, "sensitivity": 1.274213226435846 }, { "name": "model.layers.11.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.370079859152611e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7557568652555346e-05, "sensitivity": 0.7857790677345432 }, { "name": "model.layers.11.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006621081265620887, "sensitivity": 0.5653875140227614 }, { "name": "model.layers.11.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.160271368571557e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006808030302636325, "sensitivity": 0.5245687024719512 }, { "name": "model.layers.11.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.034388206899166e-05, "sensitivity": 0.7865951118755241 }, { "name": "model.layers.11.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.59787929180311e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007238417165353894, "sensitivity": 0.531128523773392 }, { "name": "model.layers.11.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000656680203974247, "sensitivity": 0.5545149699665356 }, { "name": "model.layers.11.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.142943220766028e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006878200802020729, "sensitivity": 0.5517254511661365 }, { "name": "model.layers.11.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.977490218356252e-05, "sensitivity": 0.7728735486051791 }, { "name": "model.layers.11.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.262003691721475e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.068415677873418e-05, "sensitivity": 0.7359972130515529 }, { "name": "model.layers.11.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7529086916474625e-05, "sensitivity": 0.6541230428945418 }, { "name": "model.layers.11.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.247022383831791e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006725979037582874, "sensitivity": 0.545783899722834 }, { "name": "model.layers.11.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006666940171271563, "sensitivity": 0.5393477791381771 }, { "name": "model.layers.11.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.956017048447393e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006787478923797607, "sensitivity": 0.5193965770765014 }, { "name": "model.layers.11.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007116055930964649, "sensitivity": 0.5163983060021724 }, { "name": "model.layers.11.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.512381673928758e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007416519219987094, "sensitivity": 0.5178389475122684 }, { "name": "model.layers.11.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8444922615308315e-05, "sensitivity": 0.8261181781636844 }, { "name": "model.layers.11.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.295658749877475e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000682335696183145, "sensitivity": 0.5223030956951871 }, { "name": "model.layers.11.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6408505770377815e-05, "sensitivity": 0.6628780297005148 }, { "name": "model.layers.11.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.781495815426752e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.803595558973029e-05, "sensitivity": 0.6451308050004336 }, { "name": "model.layers.11.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.899274765397422e-05, "sensitivity": 0.6830752360480908 }, { "name": "model.layers.11.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.223424406925915e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006920045125298202, "sensitivity": 0.5066886713573628 }, { "name": "model.layers.11.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0709998605307192e-05, "sensitivity": 1.2760941291913044 }, { "name": "model.layers.11.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.252533353290346e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.027795825502835e-05, "sensitivity": 0.8235260172182701 }, { "name": "model.layers.11.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006741394754499197, "sensitivity": 0.5278701970270008 }, { "name": "model.layers.11.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.105874490458518e-07, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.221261719474569e-05, "sensitivity": 0.6992084989593526 }, { "name": "model.layers.11.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 6.385485448845429e-06, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.8400713770461152e-06, "sensitivity": 2.099326973997355 }, { "name": "model.layers.11.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.102072360481543e-06, "sensitivity": 10.0 }, { "name": "model.layers.11.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.3309794439919642e-06, "sensitivity": 2.104988802766868 }, { "name": "model.layers.11.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 6.134292107162764e-06, "sensitivity": 2.1752904397754556 }, { "name": "model.layers.11.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.0001630842889426276, "sensitivity": 0.91040535852251 }, { "name": "model.layers.11.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.0399892744317185e-05, "sensitivity": 1.1543488108497717 }, { "name": "model.layers.11.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 4.889959382126108e-05, "sensitivity": 1.1891302646168425 }, { "name": "model.layers.11.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002651199174579233, "sensitivity": 0.7803161949184054 }, { "name": "model.layers.12.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.636231799144298e-05, "sensitivity": 0.759941182257984 }, { "name": "model.layers.12.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.427370635719853e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8909979998134077e-05, "sensitivity": 1.1783281600549604 }, { "name": "model.layers.12.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.885998689336702e-05, "sensitivity": 0.6052555123571318 }, { "name": "model.layers.12.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.312442337730317e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.163920625112951e-05, "sensitivity": 0.8114663749770405 }, { "name": "model.layers.12.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.16736215306446e-05, "sensitivity": 0.6785402879889288 }, { "name": "model.layers.12.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.606627150380518e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.306769500952214e-05, "sensitivity": 0.6194891774456395 }, { "name": "model.layers.12.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000690278597176075, "sensitivity": 0.524743339363307 }, { "name": "model.layers.12.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.420559657271951e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000710082589648664, "sensitivity": 0.5384992863421173 }, { "name": "model.layers.12.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.317780935205519e-05, "sensitivity": 0.6219981239749898 }, { "name": "model.layers.12.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.580711442438769e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007336337002925575, "sensitivity": 0.5758093757841802 }, { "name": "model.layers.12.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006245928816497326, "sensitivity": 0.5988081480886636 }, { "name": "model.layers.12.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.523567097043269e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.4885458666831255e-05, "sensitivity": 0.9914702905728707 }, { "name": "model.layers.12.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.595500624622218e-05, "sensitivity": 0.9312701325656729 }, { "name": "model.layers.12.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.838442120875698e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006642492371611297, "sensitivity": 0.5192191854100985 }, { "name": "model.layers.12.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006637185579165816, "sensitivity": 0.5257544706036732 }, { "name": "model.layers.12.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.047702072464745e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006839375710114837, "sensitivity": 0.5166358711770291 }, { "name": "model.layers.12.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.008095806464553e-05, "sensitivity": 0.6824242869315277 }, { "name": "model.layers.12.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.122874083303032e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006983274943195283, "sensitivity": 0.5483046700953289 }, { "name": "model.layers.12.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007211598567664623, "sensitivity": 0.5625624691591881 }, { "name": "model.layers.12.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.72952126024029e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007581400568597019, "sensitivity": 0.5145075777179439 }, { "name": "model.layers.12.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007176985964179039, "sensitivity": 0.5463312023465541 }, { "name": "model.layers.12.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.602411986023071e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007460913620889187, "sensitivity": 0.5287646178753407 }, { "name": "model.layers.12.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.719728869735263e-05, "sensitivity": 0.8605215666175463 }, { "name": "model.layers.12.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.104115411493694e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006626652320846915, "sensitivity": 0.5723892507682504 }, { "name": "model.layers.12.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6729149946477264e-05, "sensitivity": 0.7278545898064479 }, { "name": "model.layers.12.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.902280690861517e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.847858119523153e-05, "sensitivity": 0.6029579562844388 }, { "name": "model.layers.12.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.616607813863084e-05, "sensitivity": 0.9962050025239464 }, { "name": "model.layers.12.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.272196060308488e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006395844975486398, "sensitivity": 0.5959007710118852 }, { "name": "model.layers.12.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.193454464664683e-05, "sensitivity": 0.8596183987038384 }, { "name": "model.layers.12.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.583025762869511e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.407278124243021e-05, "sensitivity": 0.645775327782902 }, { "name": "model.layers.12.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006151042180135846, "sensitivity": 0.5715881071228238 }, { "name": "model.layers.12.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.563301783695351e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.576456896960735e-05, "sensitivity": 0.8741769960792249 }, { "name": "model.layers.12.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006883294554427266, "sensitivity": 0.5524746770111341 }, { "name": "model.layers.12.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.218586463546671e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007106189150363207, "sensitivity": 0.5664784169409872 }, { "name": "model.layers.12.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.069099981687032e-05, "sensitivity": 0.9454817582355571 }, { "name": "model.layers.12.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.739806164863694e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.317460065474734e-05, "sensitivity": 0.6607912575645426 }, { "name": "model.layers.12.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007170591270551085, "sensitivity": 0.5345769820749555 }, { "name": "model.layers.12.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.787880693082116e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007515839533880353, "sensitivity": 0.5697470816425864 }, { "name": "model.layers.12.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007043037912808359, "sensitivity": 0.5539295752609752 }, { "name": "model.layers.12.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.859660857116978e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007318216376006603, "sensitivity": 0.5338595850081986 }, { "name": "model.layers.12.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006845784373581409, "sensitivity": 0.5854048880502086 }, { "name": "model.layers.12.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.328408517219941e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007082149386405945, "sensitivity": 0.5176717430356143 }, { "name": "model.layers.12.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006512944819405675, "sensitivity": 0.5503723284355205 }, { "name": "model.layers.12.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.419925284717465e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006700567901134491, "sensitivity": 0.5211531160382458 }, { "name": "model.layers.12.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006482729222625494, "sensitivity": 0.5839189274362098 }, { "name": "model.layers.12.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.799781206405896e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006592727149836719, "sensitivity": 0.5063560594215736 }, { "name": "model.layers.12.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006684426916763186, "sensitivity": 0.5336485336249982 }, { "name": "model.layers.12.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.239761205506511e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007109094294719398, "sensitivity": 0.5174259363924817 }, { "name": "model.layers.12.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006635827012360096, "sensitivity": 0.5965074823943557 }, { "name": "model.layers.12.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.283787001848395e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006861781002953649, "sensitivity": 0.5493419119169018 }, { "name": "model.layers.12.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006719328230246902, "sensitivity": 0.5252050474422184 }, { "name": "model.layers.12.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.083722610128461e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006848800694569945, "sensitivity": 0.5463853861343517 }, { "name": "model.layers.12.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.940850678598508e-05, "sensitivity": 0.9959811344470813 }, { "name": "model.layers.12.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.503490794784739e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.1132693543913774e-05, "sensitivity": 1.2817616791606552 }, { "name": "model.layers.12.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0623464378295466e-05, "sensitivity": 0.7066081171975909 }, { "name": "model.layers.12.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.67514541419223e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006964506465010345, "sensitivity": 0.5027131402154881 }, { "name": "model.layers.12.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0283608036115766e-05, "sensitivity": 0.616603805971583 }, { "name": "model.layers.12.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.302692554527312e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006913223769515753, "sensitivity": 0.505025460798008 }, { "name": "model.layers.12.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006944821216166019, "sensitivity": 0.5823518498880056 }, { "name": "model.layers.12.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.885998118377756e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007446687086485326, "sensitivity": 0.5688143900828186 }, { "name": "model.layers.12.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.674914427800104e-05, "sensitivity": 0.6660712865562357 }, { "name": "model.layers.12.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.057632049305539e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006540852482430637, "sensitivity": 0.5245099026296792 }, { "name": "model.layers.12.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.238535570446402e-05, "sensitivity": 0.6118556346523719 }, { "name": "model.layers.12.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.60478121972119e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007288106717169285, "sensitivity": 0.5159612870846828 }, { "name": "model.layers.12.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007051985594443977, "sensitivity": 0.5340425872571704 }, { "name": "model.layers.12.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.466189006459899e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007267742766998708, "sensitivity": 0.5248515166328314 }, { "name": "model.layers.12.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.385624535847455e-05, "sensitivity": 0.8736300063846498 }, { "name": "model.layers.12.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.522975925487117e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006162581848911941, "sensitivity": 0.5334058310255637 }, { "name": "model.layers.12.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006579109467566013, "sensitivity": 0.5773858269609038 }, { "name": "model.layers.12.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.718190661558765e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006853702361695468, "sensitivity": 0.5468656353303916 }, { "name": "model.layers.12.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.161972851259634e-05, "sensitivity": 0.6290586947402512 }, { "name": "model.layers.12.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.564848149537283e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007047991966828704, "sensitivity": 0.5785443512187254 }, { "name": "model.layers.12.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.58749889023602e-05, "sensitivity": 0.8212811502582554 }, { "name": "model.layers.12.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.727212505415082e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8657162298914045e-05, "sensitivity": 0.792732587607683 }, { "name": "model.layers.12.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.304238922894001e-05, "sensitivity": 0.7313718832234587 }, { "name": "model.layers.12.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.779403065593215e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000730621803086251, "sensitivity": 0.5567458527328897 }, { "name": "model.layers.12.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7611610827734694e-05, "sensitivity": 1.0870911758806787 }, { "name": "model.layers.12.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.415647249014e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9877980675082654e-05, "sensitivity": 0.9761021390666428 }, { "name": "model.layers.12.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.00541643507313e-05, "sensitivity": 0.7208335181804948 }, { "name": "model.layers.12.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.413828259610455e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007322716410271823, "sensitivity": 0.5298101616918476 }, { "name": "model.layers.12.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.419850251404569e-05, "sensitivity": 0.6073675110651314 }, { "name": "model.layers.12.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.151706995500717e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007453008438460529, "sensitivity": 0.5452027474865949 }, { "name": "model.layers.12.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.186957762110978e-05, "sensitivity": 0.7889542365813849 }, { "name": "model.layers.12.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.502183964585129e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007367273792624474, "sensitivity": 0.5953982299213705 }, { "name": "model.layers.12.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.780162973678671e-05, "sensitivity": 0.7734870348426193 }, { "name": "model.layers.12.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.091003683650342e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006675328477285802, "sensitivity": 0.5405408303012746 }, { "name": "model.layers.12.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.146676605567336e-05, "sensitivity": 0.7816314965604535 }, { "name": "model.layers.12.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.444603855015885e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007009041728451848, "sensitivity": 0.5102425379002148 }, { "name": "model.layers.12.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.786094334325753e-05, "sensitivity": 0.7669438416807197 }, { "name": "model.layers.12.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.27041060852207e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006651963340118527, "sensitivity": 0.5817342957048908 }, { "name": "model.layers.12.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007323298486880958, "sensitivity": 0.5166590418411565 }, { "name": "model.layers.12.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.707585953336093e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007603932172060013, "sensitivity": 0.5292782400807197 }, { "name": "model.layers.12.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7907323935069144e-05, "sensitivity": 1.004960405898511 }, { "name": "model.layers.12.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.862941290819435e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006639162893407047, "sensitivity": 0.548907375743311 }, { "name": "model.layers.12.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006751944310963154, "sensitivity": 0.5890137764023573 }, { "name": "model.layers.12.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.239547474251594e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.22452498646453e-05, "sensitivity": 0.6603000649427458 }, { "name": "model.layers.12.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006585297523997724, "sensitivity": 0.5311659798909181 }, { "name": "model.layers.12.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.011956656948314e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006844803574495018, "sensitivity": 0.5314891345534339 }, { "name": "model.layers.12.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007072719745337963, "sensitivity": 0.53490122451838 }, { "name": "model.layers.12.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.691041107842466e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007390842656604946, "sensitivity": 0.5241588671009685 }, { "name": "model.layers.12.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.484713983605616e-05, "sensitivity": 0.8511848218081453 }, { "name": "model.layers.12.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.514946792573028e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006099209422245622, "sensitivity": 0.561864462305743 }, { "name": "model.layers.12.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.809974391013384e-05, "sensitivity": 0.7752764838575913 }, { "name": "model.layers.12.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.017108944433858e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.836947093484923e-05, "sensitivity": 0.8518957944026155 }, { "name": "model.layers.12.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000695945811457932, "sensitivity": 0.5808690172160238 }, { "name": "model.layers.12.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.415431812456518e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007319545256905258, "sensitivity": 0.5106654008651896 }, { "name": "model.layers.12.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006759455427527428, "sensitivity": 0.5297197531006302 }, { "name": "model.layers.12.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.26090752575692e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007022283971309662, "sensitivity": 0.5227785144235431 }, { "name": "model.layers.12.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0307262174319476e-05, "sensitivity": 0.8761861824537265 }, { "name": "model.layers.12.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.386932795976463e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006974959978833795, "sensitivity": 0.5341785236819516 }, { "name": "model.layers.12.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.196570757310838e-05, "sensitivity": 0.6480543425900495 }, { "name": "model.layers.12.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.556338121299632e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007126411655917764, "sensitivity": 0.5170662940090835 }, { "name": "model.layers.12.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0801064490806311e-05, "sensitivity": 1.856151173347638 }, { "name": "model.layers.12.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.284759592745104e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006966108921915293, "sensitivity": 0.5420684024716232 }, { "name": "model.layers.12.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.263422255869955e-05, "sensitivity": 0.7115034837371867 }, { "name": "model.layers.12.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.878997282910859e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007527022971771657, "sensitivity": 0.5329304014663769 }, { "name": "model.layers.12.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9890324337175116e-05, "sensitivity": 0.6643975490737969 }, { "name": "model.layers.12.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.158810492706834e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006951118703000247, "sensitivity": 0.5748505417588756 }, { "name": "model.layers.12.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000683491351082921, "sensitivity": 0.554210340379596 }, { "name": "model.layers.12.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.245331292120682e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007000734331086278, "sensitivity": 0.5481569993152704 }, { "name": "model.layers.12.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.06515932304319e-05, "sensitivity": 0.6110218055036527 }, { "name": "model.layers.12.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.449399734265171e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006991593400016427, "sensitivity": 0.5239039827362704 }, { "name": "model.layers.12.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0656690392352175e-05, "sensitivity": 1.281168874430988 }, { "name": "model.layers.12.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.129753723551403e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.814119867864065e-05, "sensitivity": 0.8146663146216453 }, { "name": "model.layers.12.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0369155461376067e-05, "sensitivity": 1.4073382385969764 }, { "name": "model.layers.12.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.251212880670209e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006831069476902485, "sensitivity": 0.5749013438627224 }, { "name": "model.layers.12.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8865563914878294e-05, "sensitivity": 1.06878296463252 }, { "name": "model.layers.12.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.393595413101139e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007081844378262758, "sensitivity": 0.5352382692357747 }, { "name": "model.layers.12.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 7.578591066703666e-06, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.992287479879451e-06, "sensitivity": 2.0987521082387626 }, { "name": "model.layers.12.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.026938189686916e-07, "sensitivity": 10.0 }, { "name": "model.layers.12.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 6.208537342899945e-06, "sensitivity": 1.8711669473939367 }, { "name": "model.layers.12.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 2.2511312636197545e-05, "sensitivity": 1.9150231379964497 }, { "name": "model.layers.12.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.0001565248385304585, "sensitivity": 1.0476692840587734 }, { "name": "model.layers.12.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.235627587448107e-05, "sensitivity": 1.934892637538176 }, { "name": "model.layers.12.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0005378288915380836, "sensitivity": 0.5895019700751076 }, { "name": "model.layers.12.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00027789006708189845, "sensitivity": 0.807532544710627 }, { "name": "model.layers.13.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006705971900373697, "sensitivity": 0.5418482597497432 }, { "name": "model.layers.13.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.104689873609459e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000683736230712384, "sensitivity": 0.5322144039325415 }, { "name": "model.layers.13.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8918300055665895e-05, "sensitivity": 0.7330366477697594 }, { "name": "model.layers.13.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.298735115706222e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006687843124382198, "sensitivity": 0.5161391331175633 }, { "name": "model.layers.13.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0258132533635944e-05, "sensitivity": 1.2529397344145543 }, { "name": "model.layers.13.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.859164957655594e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000638830941170454, "sensitivity": 0.5099671450630836 }, { "name": "model.layers.13.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.969023550278507e-05, "sensitivity": 0.9028159954690793 }, { "name": "model.layers.13.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.478475711446663e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007094345055520535, "sensitivity": 0.5768295944073324 }, { "name": "model.layers.13.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007315609836950898, "sensitivity": 0.5593875736758074 }, { "name": "model.layers.13.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.61428828152566e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007571796304546297, "sensitivity": 0.5149253875718489 }, { "name": "model.layers.13.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006658544298261404, "sensitivity": 0.5359408541017547 }, { "name": "model.layers.13.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.266459990911244e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006931519019417465, "sensitivity": 0.5371587892424631 }, { "name": "model.layers.13.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.828064604429528e-05, "sensitivity": 0.7821515051272174 }, { "name": "model.layers.13.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.320101988421811e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006783092394471169, "sensitivity": 0.5268608277509137 }, { "name": "model.layers.13.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.405344902304932e-05, "sensitivity": 0.6630617834159483 }, { "name": "model.layers.13.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.282798151209136e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007611599285155535, "sensitivity": 0.5363047656552119 }, { "name": "model.layers.13.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007043571094982326, "sensitivity": 0.5170317024911938 }, { "name": "model.layers.13.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.710947673127521e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007497264887206256, "sensitivity": 0.5401092460648746 }, { "name": "model.layers.13.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.044582859321963e-05, "sensitivity": 1.5634469974958918 }, { "name": "model.layers.13.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.233140652511793e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.022433444741182e-05, "sensitivity": 0.6452758818108215 }, { "name": "model.layers.13.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0057850886369124e-05, "sensitivity": 1.2393276483625564 }, { "name": "model.layers.13.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.76686306380725e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006576689193025231, "sensitivity": 0.5234686715334745 }, { "name": "model.layers.13.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.202467920957133e-05, "sensitivity": 0.7241771981638798 }, { "name": "model.layers.13.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1245350606259308e-06, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007177807274274528, "sensitivity": 0.5274597427284188 }, { "name": "model.layers.13.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6647892051842064e-05, "sensitivity": 0.8248015733301655 }, { "name": "model.layers.13.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.402883852591913e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.717950261896476e-05, "sensitivity": 0.6403121828619804 }, { "name": "model.layers.13.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007011740235611796, "sensitivity": 0.5590657571429916 }, { "name": "model.layers.13.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.408408808056265e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007200231775641441, "sensitivity": 0.5367367028080665 }, { "name": "model.layers.13.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.98106998950243e-05, "sensitivity": 0.7439584363405798 }, { "name": "model.layers.13.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.688398457299627e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007016637828201056, "sensitivity": 0.5089717111989815 }, { "name": "model.layers.13.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.420414865715429e-05, "sensitivity": 0.6600545217049201 }, { "name": "model.layers.13.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.475464371964335e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007460989872924984, "sensitivity": 0.5729863193301702 }, { "name": "model.layers.13.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.857076757820323e-05, "sensitivity": 1.161018904821625 }, { "name": "model.layers.13.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.665043307904853e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.133363058324903e-05, "sensitivity": 0.75392578187197 }, { "name": "model.layers.13.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007242028368636966, "sensitivity": 0.5340912451292371 }, { "name": "model.layers.13.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.593145371880382e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007510663708671927, "sensitivity": 0.556822898814817 }, { "name": "model.layers.13.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006651420844718814, "sensitivity": 0.537471803954744 }, { "name": "model.layers.13.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.493305590993259e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006838254630565643, "sensitivity": 0.5046802066622342 }, { "name": "model.layers.13.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.852907634107396e-05, "sensitivity": 0.6019217572938944 }, { "name": "model.layers.13.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.288511258389917e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007051086286082864, "sensitivity": 0.5610005585605815 }, { "name": "model.layers.13.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9965805121464655e-05, "sensitivity": 0.803433359058456 }, { "name": "model.layers.13.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.426313348129042e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007107971468940377, "sensitivity": 0.5124178423144684 }, { "name": "model.layers.13.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.299755477812141e-05, "sensitivity": 0.7270705984012271 }, { "name": "model.layers.13.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.566921797457326e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007494239835068583, "sensitivity": 0.5402497718071926 }, { "name": "model.layers.13.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.822919411002658e-05, "sensitivity": 0.6355970953416358 }, { "name": "model.layers.13.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.276121666815015e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.054139157640748e-05, "sensitivity": 0.8598011770048394 }, { "name": "model.layers.13.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007017932366579771, "sensitivity": 0.5439270217786126 }, { "name": "model.layers.13.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.641583922828431e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000721562304534018, "sensitivity": 0.5559405541089271 }, { "name": "model.layers.13.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.438120908569545e-05, "sensitivity": 0.8176482380656251 }, { "name": "model.layers.13.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.880265805695672e-06, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.434034730773419e-05, "sensitivity": 0.634363924776348 }, { "name": "model.layers.13.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006877341656945646, "sensitivity": 0.5916884303959782 }, { "name": "model.layers.13.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.652644515270367e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007265376625582576, "sensitivity": 0.5367827979677593 }, { "name": "model.layers.13.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000657983124256134, "sensitivity": 0.5460789233439325 }, { "name": "model.layers.13.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.925389245931001e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006730548338964581, "sensitivity": 0.506115395223929 }, { "name": "model.layers.13.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007061773794703186, "sensitivity": 0.5564259195725404 }, { "name": "model.layers.13.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.850825684523443e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007307949708774686, "sensitivity": 0.5425764461643929 }, { "name": "model.layers.13.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1806369002442807e-05, "sensitivity": 1.2588698300122558 }, { "name": "model.layers.13.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.826149044376507e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.956540164537728e-05, "sensitivity": 0.6597936191563625 }, { "name": "model.layers.13.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000702214427292347, "sensitivity": 0.5583391136751825 }, { "name": "model.layers.13.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.766457545381854e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007205373840406537, "sensitivity": 0.5308899788893989 }, { "name": "model.layers.13.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006596962921321392, "sensitivity": 0.5708021702944801 }, { "name": "model.layers.13.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.959066129435087e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.942365896771662e-05, "sensitivity": 0.610312809173613 }, { "name": "model.layers.13.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006809655460529029, "sensitivity": 0.5829784180406694 }, { "name": "model.layers.13.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.538148227264173e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007335233385674655, "sensitivity": 0.5414627804128236 }, { "name": "model.layers.13.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9437337768031284e-05, "sensitivity": 0.9473804963533099 }, { "name": "model.layers.13.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.781747513035953e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.031511293258518e-05, "sensitivity": 0.8157532096467046 }, { "name": "model.layers.13.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007286419859156013, "sensitivity": 0.55683918945083 }, { "name": "model.layers.13.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.966896535232081e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007589161396026611, "sensitivity": 0.547234537338825 }, { "name": "model.layers.13.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.217305781319737e-05, "sensitivity": 0.6466447375250708 }, { "name": "model.layers.13.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.812196033934015e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007595595670863986, "sensitivity": 0.5166545779943985 }, { "name": "model.layers.13.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007004259969107807, "sensitivity": 0.5257467957320046 }, { "name": "model.layers.13.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.562853513969458e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007197301601991057, "sensitivity": 0.537577327987681 }, { "name": "model.layers.13.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006650143186561763, "sensitivity": 0.5064377206493583 }, { "name": "model.layers.13.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.008747277519433e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006847957847639918, "sensitivity": 0.5345804911308001 }, { "name": "model.layers.13.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.024158210493624e-05, "sensitivity": 0.6819080305607849 }, { "name": "model.layers.13.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.324264631984988e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006958772428333759, "sensitivity": 0.5503256189531173 }, { "name": "model.layers.13.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.181489152368158e-05, "sensitivity": 0.6775718163632408 }, { "name": "model.layers.13.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.206751545003499e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.401163409464061e-05, "sensitivity": 0.6667229417017793 }, { "name": "model.layers.13.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000679697550367564, "sensitivity": 0.5342462993443657 }, { "name": "model.layers.13.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.535166789944924e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007408942328765988, "sensitivity": 0.5462068178342693 }, { "name": "model.layers.13.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.790631257696077e-05, "sensitivity": 1.0133839198565133 }, { "name": "model.layers.13.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3056281886747456e-06, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.034310717950575e-05, "sensitivity": 1.0299393227124674 }, { "name": "model.layers.13.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000705104204826057, "sensitivity": 0.5440496919465222 }, { "name": "model.layers.13.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.808463695051614e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007264238665811718, "sensitivity": 0.5118185704971003 }, { "name": "model.layers.13.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.05301174800843e-05, "sensitivity": 0.8396026136695491 }, { "name": "model.layers.13.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.445295639423421e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006891838274896145, "sensitivity": 0.5279721094025157 }, { "name": "model.layers.13.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.228846905287355e-05, "sensitivity": 0.9172532659546316 }, { "name": "model.layers.13.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.713593165841303e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007203062996268272, "sensitivity": 0.5557897836704917 }, { "name": "model.layers.13.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.298576772678643e-05, "sensitivity": 0.710141172354313 }, { "name": "model.layers.13.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.525521030198433e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007246903842315078, "sensitivity": 0.5176168997223963 }, { "name": "model.layers.13.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.527234654640779e-05, "sensitivity": 0.6134318375746868 }, { "name": "model.layers.13.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.258151981659466e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007720102439634502, "sensitivity": 0.5889224034714904 }, { "name": "model.layers.13.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7006236602319404e-05, "sensitivity": 0.8686722991269762 }, { "name": "model.layers.13.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.012977564751054e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000646440195851028, "sensitivity": 0.5456577317382206 }, { "name": "model.layers.13.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006992561975494027, "sensitivity": 0.5907440903667776 }, { "name": "model.layers.13.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.626024742217851e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000746759760659188, "sensitivity": 0.5347358460399324 }, { "name": "model.layers.13.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.1390333131421357e-06, "sensitivity": 2.097142131232253 }, { "name": "model.layers.13.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.257828886191419e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006342150154523551, "sensitivity": 0.5867642382041823 }, { "name": "model.layers.13.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.397015386028215e-05, "sensitivity": 0.8487237990698264 }, { "name": "model.layers.13.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.588140533698606e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.674084579572082e-05, "sensitivity": 0.6347324397784037 }, { "name": "model.layers.13.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.297070649452507e-05, "sensitivity": 0.6412547881785828 }, { "name": "model.layers.13.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.56680981592217e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.577970634680241e-05, "sensitivity": 0.7378154670210785 }, { "name": "model.layers.13.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006760961259715259, "sensitivity": 0.5964924607680248 }, { "name": "model.layers.13.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.363969760059263e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006821169517934322, "sensitivity": 0.5617305142838773 }, { "name": "model.layers.13.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.047442366252653e-05, "sensitivity": 0.7186710208753743 }, { "name": "model.layers.13.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.652358024439309e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006946390494704247, "sensitivity": 0.5861683210423596 }, { "name": "model.layers.13.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000663559592794627, "sensitivity": 0.5114296921292939 }, { "name": "model.layers.13.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.967132210571435e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006816376699134707, "sensitivity": 0.5900383227126988 }, { "name": "model.layers.13.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006749517051503062, "sensitivity": 0.5549459888235914 }, { "name": "model.layers.13.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.209310186022776e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007015386363491416, "sensitivity": 0.5273847693322626 }, { "name": "model.layers.13.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7939520047511905e-05, "sensitivity": 0.6561468017299673 }, { "name": "model.layers.13.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.098159133216541e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006763784913346171, "sensitivity": 0.5317467416830755 }, { "name": "model.layers.13.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.870843233424239e-05, "sensitivity": 0.6232871830775193 }, { "name": "model.layers.13.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.80344214742945e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006642249645665288, "sensitivity": 0.5748447298135455 }, { "name": "model.layers.13.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006707921857014298, "sensitivity": 0.5798794080686547 }, { "name": "model.layers.13.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.265552201512037e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007067783735692501, "sensitivity": 0.5043957414094913 }, { "name": "model.layers.13.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006925404886715114, "sensitivity": 0.5412814125525611 }, { "name": "model.layers.13.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.361624400597066e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007243709405884147, "sensitivity": 0.5788457366618766 }, { "name": "model.layers.13.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.513237167382613e-05, "sensitivity": 0.9362962450225583 }, { "name": "model.layers.13.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.48554953133862e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007813346455805004, "sensitivity": 0.531018691177048 }, { "name": "model.layers.13.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006926512578502297, "sensitivity": 0.5244504915199122 }, { "name": "model.layers.13.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.271530992307817e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007068172562867403, "sensitivity": 0.5665036049315471 }, { "name": "model.layers.13.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000684476166497916, "sensitivity": 0.5860145444792346 }, { "name": "model.layers.13.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.396858225343749e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007099999347701669, "sensitivity": 0.5096769626380164 }, { "name": "model.layers.13.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.78506660531275e-05, "sensitivity": 0.8498135862858365 }, { "name": "model.layers.13.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.005404422168795e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.94886441831477e-05, "sensitivity": 0.612439734281197 }, { "name": "model.layers.13.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007072924636304379, "sensitivity": 0.5432184665027648 }, { "name": "model.layers.13.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.91239051775483e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007575529161840677, "sensitivity": 0.5926635555288478 }, { "name": "model.layers.13.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 7.023246325843502e-06, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.9417202565819025e-06, "sensitivity": 2.0990889568773845 }, { "name": "model.layers.13.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.988203722357866e-07, "sensitivity": 10.0 }, { "name": "model.layers.13.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.48803565025446e-06, "sensitivity": 2.105817594416845 }, { "name": "model.layers.13.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 5.592394700215664e-06, "sensitivity": 2.1730539557518287 }, { "name": "model.layers.13.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00016621100076008588, "sensitivity": 1.0622823339169334 }, { "name": "model.layers.13.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.2051654266542755e-05, "sensitivity": 1.5805417042889367 }, { "name": "model.layers.13.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.4553205700358376e-05, "sensitivity": 0.7561287938176162 }, { "name": "model.layers.13.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00027277428307570517, "sensitivity": 0.8600608511230464 }, { "name": "model.layers.14.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9268990298733115e-05, "sensitivity": 0.6322325016396934 }, { "name": "model.layers.14.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.612514766857203e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.099935853853822e-05, "sensitivity": 0.6065561518180216 }, { "name": "model.layers.14.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.182621291372925e-05, "sensitivity": 0.7905661764359047 }, { "name": "model.layers.14.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.665406431238807e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006953291594982147, "sensitivity": 0.5638319062949773 }, { "name": "model.layers.14.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006711941678076982, "sensitivity": 0.5258299497159836 }, { "name": "model.layers.14.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.256394158299372e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007004779763519764, "sensitivity": 0.5196989868154835 }, { "name": "model.layers.14.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.136541196610779e-05, "sensitivity": 0.7325720351847427 }, { "name": "model.layers.14.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.419115834432887e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007138288347050548, "sensitivity": 0.5232279602288801 }, { "name": "model.layers.14.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0114781616721302e-05, "sensitivity": 1.4089211817374212 }, { "name": "model.layers.14.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.764561592513928e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006350773619487882, "sensitivity": 0.548971630127804 }, { "name": "model.layers.14.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.358754762914032e-05, "sensitivity": 0.6707808366771462 }, { "name": "model.layers.14.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.295035970855679e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.626039248658344e-05, "sensitivity": 0.7282526931636053 }, { "name": "model.layers.14.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.521831528516486e-05, "sensitivity": 0.7615765748472758 }, { "name": "model.layers.14.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.99384600011399e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007584767299704254, "sensitivity": 0.5317295669804039 }, { "name": "model.layers.14.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0202062185271643e-05, "sensitivity": 1.4839098967390707 }, { "name": "model.layers.14.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.659653877250094e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006286596180871129, "sensitivity": 0.5130713167803612 }, { "name": "model.layers.14.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.646835415973328e-05, "sensitivity": 0.9761927693431046 }, { "name": "model.layers.14.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.526640277115803e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000634396041277796, "sensitivity": 0.5233997021729639 }, { "name": "model.layers.14.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.841189340571873e-05, "sensitivity": 0.7756194531827675 }, { "name": "model.layers.14.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.164216301840497e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006668863352388144, "sensitivity": 0.5696541462353261 }, { "name": "model.layers.14.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9959151258226484e-05, "sensitivity": 0.8673797323741852 }, { "name": "model.layers.14.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.190503765741596e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006811079801991582, "sensitivity": 0.555259330947314 }, { "name": "model.layers.14.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.44987085252069e-05, "sensitivity": 0.83294562661065 }, { "name": "model.layers.14.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.034919005694974e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007518300553783774, "sensitivity": 0.5832566696712773 }, { "name": "model.layers.14.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0158889381273184e-05, "sensitivity": 1.9870995959226678 }, { "name": "model.layers.14.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4533732155541657e-06, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.576657713390887e-05, "sensitivity": 0.6897397724933797 }, { "name": "model.layers.14.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.17035329923965e-05, "sensitivity": 0.8119272346240194 }, { "name": "model.layers.14.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.546405870722083e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.349570321617648e-05, "sensitivity": 0.7276692070714615 }, { "name": "model.layers.14.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.008361742715351e-05, "sensitivity": 0.6571453659062083 }, { "name": "model.layers.14.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.459359150947421e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000674002687446773, "sensitivity": 0.5249109866804119 }, { "name": "model.layers.14.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.815521581098437e-05, "sensitivity": 0.7648110755693622 }, { "name": "model.layers.14.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.845793111802777e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006603134097531438, "sensitivity": 0.5496829632191528 }, { "name": "model.layers.14.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0950413525279146e-05, "sensitivity": 1.7174246659667134 }, { "name": "model.layers.14.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.614212679778575e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00069773307768628, "sensitivity": 0.5500594645690452 }, { "name": "model.layers.14.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007036286406219006, "sensitivity": 0.5546038689569099 }, { "name": "model.layers.14.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.049206942610908e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007197256200015545, "sensitivity": 0.5375633341152615 }, { "name": "model.layers.14.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.03454936936032e-05, "sensitivity": 0.8128724431042207 }, { "name": "model.layers.14.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.427541165976436e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006928577786311507, "sensitivity": 0.5402750014968624 }, { "name": "model.layers.14.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0622289311140776e-05, "sensitivity": 0.9521343935491201 }, { "name": "model.layers.14.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.727292998220946e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007034544833004475, "sensitivity": 0.524078366802857 }, { "name": "model.layers.14.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.076219450624194e-05, "sensitivity": 1.2096129914076144 }, { "name": "model.layers.14.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.314782012850628e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000694778747856617, "sensitivity": 0.5680851335421734 }, { "name": "model.layers.14.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.165176455397159e-05, "sensitivity": 0.6773202865689553 }, { "name": "model.layers.14.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.102424888216774e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006895895348861814, "sensitivity": 0.5435347648055046 }, { "name": "model.layers.14.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.373008363880217e-05, "sensitivity": 0.6552417846466466 }, { "name": "model.layers.14.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.864644319648505e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007339939475059509, "sensitivity": 0.5317276674689597 }, { "name": "model.layers.14.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4876913054613397e-05, "sensitivity": 0.6604132150762192 }, { "name": "model.layers.14.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.782500807072211e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000646826985757798, "sensitivity": 0.5133493342609248 }, { "name": "model.layers.14.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006695803604088724, "sensitivity": 0.5488528584017298 }, { "name": "model.layers.14.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.217260306584649e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007011896814219654, "sensitivity": 0.5237389776281608 }, { "name": "model.layers.14.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.062864849809557e-05, "sensitivity": 1.02116531938687 }, { "name": "model.layers.14.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.544739221681084e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006979169556871057, "sensitivity": 0.5273634391402818 }, { "name": "model.layers.14.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1121813258796465e-05, "sensitivity": 1.5328731130574724 }, { "name": "model.layers.14.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.216898214006505e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006979742320254445, "sensitivity": 0.5874986646061198 }, { "name": "model.layers.14.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007048522820696235, "sensitivity": 0.5783158397346168 }, { "name": "model.layers.14.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.538946308864979e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007455623708665371, "sensitivity": 0.5415162373220693 }, { "name": "model.layers.14.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.026985283824615e-05, "sensitivity": 0.6070173589338724 }, { "name": "model.layers.14.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.694330636491941e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.111695984145626e-05, "sensitivity": 0.634308091507239 }, { "name": "model.layers.14.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.911339758313261e-05, "sensitivity": 0.6973177695591772 }, { "name": "model.layers.14.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.594434012185957e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006921462481841445, "sensitivity": 0.5520639981231106 }, { "name": "model.layers.14.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.929524195380509e-05, "sensitivity": 0.6216219172089211 }, { "name": "model.layers.14.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.540525419040932e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006809606566093862, "sensitivity": 0.552576858458307 }, { "name": "model.layers.14.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0014303370553534e-05, "sensitivity": 1.5043533379375933 }, { "name": "model.layers.14.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.854338951394311e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006361134583130479, "sensitivity": 0.5331196971126233 }, { "name": "model.layers.14.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.661091927322559e-05, "sensitivity": 0.9414730058696977 }, { "name": "model.layers.14.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.892927674722159e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006513199186883867, "sensitivity": 0.5202020703876561 }, { "name": "model.layers.14.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.358942482620478e-05, "sensitivity": 0.7408772260482536 }, { "name": "model.layers.14.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.926201194801251e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007590416353195906, "sensitivity": 0.5652752001521282 }, { "name": "model.layers.14.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.609877916867845e-05, "sensitivity": 0.6794691728587788 }, { "name": "model.layers.14.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.864686727363733e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000657767232041806, "sensitivity": 0.5431134262719224 }, { "name": "model.layers.14.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.664557102136314e-05, "sensitivity": 0.6824614023494072 }, { "name": "model.layers.14.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.928119316602533e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006928417133167386, "sensitivity": 0.5689968615973146 }, { "name": "model.layers.14.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.662355033564381e-05, "sensitivity": 0.6749726561825502 }, { "name": "model.layers.14.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.794695650569338e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006553381681442261, "sensitivity": 0.5604486985064434 }, { "name": "model.layers.14.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.154500442789868e-05, "sensitivity": 0.8022074811195576 }, { "name": "model.layers.14.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.735085662512574e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007084164535626769, "sensitivity": 0.5669361892482073 }, { "name": "model.layers.14.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.247959390748292e-05, "sensitivity": 0.9025124350299286 }, { "name": "model.layers.14.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.786871153963148e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007416463340632617, "sensitivity": 0.5700681885147375 }, { "name": "model.layers.14.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.620008960249834e-05, "sensitivity": 1.062774370364688 }, { "name": "model.layers.14.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.884919573873049e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006454241229221225, "sensitivity": 0.5545993414816167 }, { "name": "model.layers.14.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.287000021780841e-05, "sensitivity": 1.0925294053766819 }, { "name": "model.layers.14.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.673954319718177e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006292553152889013, "sensitivity": 0.5603250454598456 }, { "name": "model.layers.14.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.739732296206057e-05, "sensitivity": 0.6738209023267594 }, { "name": "model.layers.14.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.981619324302301e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006517893634736538, "sensitivity": 0.5122537780678572 }, { "name": "model.layers.14.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.948764010099694e-05, "sensitivity": 0.9349434467936886 }, { "name": "model.layers.14.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.127915526121797e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006851565558463335, "sensitivity": 0.5357605579627281 }, { "name": "model.layers.14.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006594301084987819, "sensitivity": 0.5297145633349688 }, { "name": "model.layers.14.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.126947482698597e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006962987827137113, "sensitivity": 0.5434787173233784 }, { "name": "model.layers.14.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.790558861917816e-05, "sensitivity": 0.7977648314111919 }, { "name": "model.layers.14.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.557503411386278e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.087414966605138e-05, "sensitivity": 1.2035736063937292 }, { "name": "model.layers.14.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.896287620998919e-05, "sensitivity": 0.9557525957032791 }, { "name": "model.layers.14.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.163539865156054e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.165869126562029e-05, "sensitivity": 0.7768014718071815 }, { "name": "model.layers.14.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6667991884751245e-05, "sensitivity": 0.7791439410461196 }, { "name": "model.layers.14.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.93195636611199e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006419676938094199, "sensitivity": 0.5586400002791453 }, { "name": "model.layers.14.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0632708482444286e-05, "sensitivity": 0.9451040512434385 }, { "name": "model.layers.14.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.179057550070866e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007082949741743505, "sensitivity": 0.5642976662145509 }, { "name": "model.layers.14.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.34800162515603e-05, "sensitivity": 0.8535398964823151 }, { "name": "model.layers.14.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.963929308767547e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007346257334575057, "sensitivity": 0.5932081785876594 }, { "name": "model.layers.14.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.92258402321022e-05, "sensitivity": 0.8044227687170202 }, { "name": "model.layers.14.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.314308507171518e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006685070693492889, "sensitivity": 0.5519966258729392 }, { "name": "model.layers.14.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.389514601323754e-05, "sensitivity": 0.7717215594853437 }, { "name": "model.layers.14.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.733729034953285e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007038887124508619, "sensitivity": 0.5385640215636607 }, { "name": "model.layers.14.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007099129725247622, "sensitivity": 0.5127105997568068 }, { "name": "model.layers.14.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.496597393379488e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000729805207811296, "sensitivity": 0.5351931010254082 }, { "name": "model.layers.14.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006477303104475141, "sensitivity": 0.5673332553655167 }, { "name": "model.layers.14.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.897617256778176e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006664302200078964, "sensitivity": 0.5379584180981677 }, { "name": "model.layers.14.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.409410707419738e-05, "sensitivity": 1.0849564193191377 }, { "name": "model.layers.14.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.692253009532578e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007320276345126331, "sensitivity": 0.5629348729903022 }, { "name": "model.layers.14.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.960026101092808e-05, "sensitivity": 0.747871766428573 }, { "name": "model.layers.14.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.359387043630704e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006975971045903862, "sensitivity": 0.542365921274386 }, { "name": "model.layers.14.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006844731396995485, "sensitivity": 0.5964761064349269 }, { "name": "model.layers.14.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.470443167927442e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.166138336993754e-05, "sensitivity": 0.6067881755765269 }, { "name": "model.layers.14.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.785465691587888e-05, "sensitivity": 0.9866881957447801 }, { "name": "model.layers.14.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.112950359238312e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006773656932637095, "sensitivity": 0.5441838736242453 }, { "name": "model.layers.14.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007127697463147342, "sensitivity": 0.5642506327808916 }, { "name": "model.layers.14.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.665838441222149e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.614334415644407e-05, "sensitivity": 0.9147937003731529 }, { "name": "model.layers.14.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.696304651792161e-05, "sensitivity": 1.1440209274858266 }, { "name": "model.layers.14.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.144169333310856e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006720131495967507, "sensitivity": 0.5369806850950664 }, { "name": "model.layers.14.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.904833597014658e-05, "sensitivity": 0.9660844180499147 }, { "name": "model.layers.14.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.331824238259287e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007056173635646701, "sensitivity": 0.5369505475446392 }, { "name": "model.layers.14.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.285589188337326e-05, "sensitivity": 0.6103461003620749 }, { "name": "model.layers.14.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.41807696158503e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007299637654796243, "sensitivity": 0.5321541192596554 }, { "name": "model.layers.14.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.835774936713278e-05, "sensitivity": 1.0005837654300196 }, { "name": "model.layers.14.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.325494723569136e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.119506724644452e-05, "sensitivity": 0.6549636907652477 }, { "name": "model.layers.14.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.878100637346506e-05, "sensitivity": 0.6482106603955617 }, { "name": "model.layers.14.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.057829864403175e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006944274064153433, "sensitivity": 0.5356833592698961 }, { "name": "model.layers.14.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.173417932586744e-05, "sensitivity": 0.871210710111938 }, { "name": "model.layers.14.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.188000381574966e-07, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.371442577801645e-05, "sensitivity": 0.6996696389132415 }, { "name": "model.layers.14.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 6.352083346428117e-06, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.110377863573376e-06, "sensitivity": 2.0992645157304297 }, { "name": "model.layers.14.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0223066055914387e-06, "sensitivity": 10.0 }, { "name": "model.layers.14.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 6.370866231009131e-06, "sensitivity": 1.3698959784549751 }, { "name": "model.layers.14.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 2.392660826444626e-05, "sensitivity": 1.4899908174045529 }, { "name": "model.layers.14.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.0001749361545080319, "sensitivity": 1.0545815329153554 }, { "name": "model.layers.14.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.3910425877838861e-05, "sensitivity": 1.5339453268740733 }, { "name": "model.layers.14.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.4254192946245894e-05, "sensitivity": 0.6604624794646152 }, { "name": "model.layers.14.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00027901766588911414, "sensitivity": 0.6704371725192947 }, { "name": "model.layers.15.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.994607272441499e-05, "sensitivity": 0.7222584130196478 }, { "name": "model.layers.15.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.210191259015119e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006863586604595184, "sensitivity": 0.518342683637294 }, { "name": "model.layers.15.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.186324026202783e-05, "sensitivity": 0.6702310736584287 }, { "name": "model.layers.15.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.850928002677392e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007217337260954082, "sensitivity": 0.5282199206508625 }, { "name": "model.layers.15.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0510174433875363e-05, "sensitivity": 1.2108000531645027 }, { "name": "model.layers.15.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.485654691663512e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006415427196770906, "sensitivity": 0.59872585789672 }, { "name": "model.layers.15.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.135923467809334e-05, "sensitivity": 0.6191004746580333 }, { "name": "model.layers.15.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.86376438352454e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007037408649921417, "sensitivity": 0.565493423806565 }, { "name": "model.layers.15.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7445326092420146e-05, "sensitivity": 1.0306020483751168 }, { "name": "model.layers.15.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.620583690164494e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006733631598763168, "sensitivity": 0.5365799198307969 }, { "name": "model.layers.15.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.739625703427009e-05, "sensitivity": 0.7714115888931953 }, { "name": "model.layers.15.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.04732804276864e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000661818019580096, "sensitivity": 0.5198987581125166 }, { "name": "model.layers.15.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8745437854668126e-05, "sensitivity": 0.6666344396106156 }, { "name": "model.layers.15.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.114966820154223e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006629982381127775, "sensitivity": 0.5073635727340801 }, { "name": "model.layers.15.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000672802678309381, "sensitivity": 0.5791580512962112 }, { "name": "model.layers.15.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.527840241687954e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006804637378081679, "sensitivity": 0.5488049421547193 }, { "name": "model.layers.15.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9845457144547254e-05, "sensitivity": 0.63695721345225 }, { "name": "model.layers.15.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.729562755936058e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00068604142870754, "sensitivity": 0.5443394920222941 }, { "name": "model.layers.15.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8989440731238574e-05, "sensitivity": 0.6978506966590899 }, { "name": "model.layers.15.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.454281447076937e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006981170154176652, "sensitivity": 0.5389050096924505 }, { "name": "model.layers.15.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.747718023485504e-05, "sensitivity": 0.786252079216689 }, { "name": "model.layers.15.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.584000627502974e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006807716563344002, "sensitivity": 0.5705604893601834 }, { "name": "model.layers.15.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8597142924554646e-05, "sensitivity": 0.8332342378279333 }, { "name": "model.layers.15.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.591416763512825e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006561046466231346, "sensitivity": 0.5961256026774857 }, { "name": "model.layers.15.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0144193765881937e-05, "sensitivity": 1.7203817598207916 }, { "name": "model.layers.15.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.055945161482668e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000653531402349472, "sensitivity": 0.5749766275734599 }, { "name": "model.layers.15.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0666636272799224e-05, "sensitivity": 0.7137081055869655 }, { "name": "model.layers.15.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.643423944296956e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007101005176082253, "sensitivity": 0.5385740128448679 }, { "name": "model.layers.15.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.98198821535334e-05, "sensitivity": 1.025194893273494 }, { "name": "model.layers.15.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.188038810250873e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006951174582354724, "sensitivity": 0.5292173069541033 }, { "name": "model.layers.15.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.816874808166176e-06, "sensitivity": 1.3075019287924385 }, { "name": "model.layers.15.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.159547751849459e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006726091960445046, "sensitivity": 0.5345230448306958 }, { "name": "model.layers.15.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0520192518015392e-05, "sensitivity": 1.2512583744645422 }, { "name": "model.layers.15.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.449577085732017e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006421219441108406, "sensitivity": 0.559220839342183 }, { "name": "model.layers.15.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9351586969569325e-05, "sensitivity": 0.9717988654598315 }, { "name": "model.layers.15.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.250061801438278e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000680600933264941, "sensitivity": 0.5159049905162431 }, { "name": "model.layers.15.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0244619817240164e-05, "sensitivity": 0.6952996618115642 }, { "name": "model.layers.15.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.026630441941961e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007048847037367523, "sensitivity": 0.5357826490622595 }, { "name": "model.layers.15.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.183987716212869e-05, "sensitivity": 0.6837694887297263 }, { "name": "model.layers.15.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.487121027021203e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007006459636613727, "sensitivity": 0.5345927794970369 }, { "name": "model.layers.15.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0780198863358237e-05, "sensitivity": 1.8155627927458127 }, { "name": "model.layers.15.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.136965566838626e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006870089564472437, "sensitivity": 0.5050264926049329 }, { "name": "model.layers.15.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006763748824596405, "sensitivity": 0.5270647197797189 }, { "name": "model.layers.15.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.412203106265224e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006908592185936868, "sensitivity": 0.5214844764533157 }, { "name": "model.layers.15.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0896716958086472e-05, "sensitivity": 1.4311009622013884 }, { "name": "model.layers.15.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.667755994589243e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9597063227556646e-05, "sensitivity": 0.6374442748788326 }, { "name": "model.layers.15.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.868739026482217e-05, "sensitivity": 0.7722726482422284 }, { "name": "model.layers.15.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.395239324774593e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006808950565755367, "sensitivity": 0.5757904912637354 }, { "name": "model.layers.15.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6833185226423666e-05, "sensitivity": 0.7538190644562284 }, { "name": "model.layers.15.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.309298896667315e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006401796126738191, "sensitivity": 0.5275963623757483 }, { "name": "model.layers.15.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0073348676087335e-05, "sensitivity": 1.7188261359347217 }, { "name": "model.layers.15.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.33527804438927e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000663451268337667, "sensitivity": 0.5678399960370867 }, { "name": "model.layers.15.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006718876538798213, "sensitivity": 0.5371554134519129 }, { "name": "model.layers.15.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.483032848336734e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006889407522976398, "sensitivity": 0.5527496592720551 }, { "name": "model.layers.15.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0673548786144238e-05, "sensitivity": 1.2875203068578505 }, { "name": "model.layers.15.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.865850193411461e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7259032473666593e-05, "sensitivity": 0.6666493278011713 }, { "name": "model.layers.15.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006617532926611602, "sensitivity": 0.5308410418079771 }, { "name": "model.layers.15.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.961376470826508e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006734427297487855, "sensitivity": 0.52839117975544 }, { "name": "model.layers.15.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6158674851758406e-05, "sensitivity": 1.0869032836146342 }, { "name": "model.layers.15.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.632328108935326e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.667746518156491e-05, "sensitivity": 0.6334351516311424 }, { "name": "model.layers.15.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006979623576626182, "sensitivity": 0.5950335926767372 }, { "name": "model.layers.15.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.470006610470591e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007059215568006039, "sensitivity": 0.5380353412458824 }, { "name": "model.layers.15.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0474260307091754e-05, "sensitivity": 1.488778685828328 }, { "name": "model.layers.15.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.94450534410862e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006677600322291255, "sensitivity": 0.5592764205978438 }, { "name": "model.layers.15.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.966002936474979e-05, "sensitivity": 0.719210013377719 }, { "name": "model.layers.15.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.546755457748077e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007064248202368617, "sensitivity": 0.5144651927973993 }, { "name": "model.layers.15.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007394430576823652, "sensitivity": 0.5873456447112639 }, { "name": "model.layers.15.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.407742259601946e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007494264282286167, "sensitivity": 0.5268109764475678 }, { "name": "model.layers.15.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.671260805684142e-05, "sensitivity": 0.8382725426594132 }, { "name": "model.layers.15.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.226919365166395e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006523224292322993, "sensitivity": 0.5063427715694083 }, { "name": "model.layers.15.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.225942343007773e-05, "sensitivity": 0.8937317281002206 }, { "name": "model.layers.15.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.294214358604222e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007095427718013525, "sensitivity": 0.5632144840016122 }, { "name": "model.layers.15.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.29457863396965e-05, "sensitivity": 0.6267379069456496 }, { "name": "model.layers.15.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.732716428814456e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007197781233116984, "sensitivity": 0.5218558477672534 }, { "name": "model.layers.15.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.552562263095751e-05, "sensitivity": 0.6168767905555625 }, { "name": "model.layers.15.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.245574806802324e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007641931879334152, "sensitivity": 0.5653564038807891 }, { "name": "model.layers.15.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007112567545846105, "sensitivity": 0.539255058865258 }, { "name": "model.layers.15.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.823223657193012e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007275845855474472, "sensitivity": 0.5039875679866103 }, { "name": "model.layers.15.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.098483572714031e-05, "sensitivity": 0.6875188267575335 }, { "name": "model.layers.15.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.683962965325918e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007036597235128284, "sensitivity": 0.5887076964266216 }, { "name": "model.layers.15.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006289802258834243, "sensitivity": 0.5617961074733278 }, { "name": "model.layers.15.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.364828888967168e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006421259604394436, "sensitivity": 0.5574332805594381 }, { "name": "model.layers.15.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007081645308062434, "sensitivity": 0.5533160957196352 }, { "name": "model.layers.15.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.587309826500132e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007438319153152406, "sensitivity": 0.539178313024078 }, { "name": "model.layers.15.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006866293260827661, "sensitivity": 0.5195799216321421 }, { "name": "model.layers.15.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.770687832613476e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006985652144066989, "sensitivity": 0.5522743220937621 }, { "name": "model.layers.15.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.700884503312409e-05, "sensitivity": 0.9246220210228486 }, { "name": "model.layers.15.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.524982154587633e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006441748701035976, "sensitivity": 0.5485950780941632 }, { "name": "model.layers.15.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.634455010294914e-05, "sensitivity": 1.0750183397882769 }, { "name": "model.layers.15.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.878034698980628e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006670739385299385, "sensitivity": 0.5276572932385426 }, { "name": "model.layers.15.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.919231625739485e-05, "sensitivity": 0.7827719011553838 }, { "name": "model.layers.15.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.512183290396933e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006541367620229721, "sensitivity": 0.5387953270855158 }, { "name": "model.layers.15.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.147424574010074e-05, "sensitivity": 0.8302693002861459 }, { "name": "model.layers.15.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.08785137248924e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007045291131362319, "sensitivity": 0.5367284826530241 }, { "name": "model.layers.15.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6669668992981315e-05, "sensitivity": 0.6926407968959543 }, { "name": "model.layers.15.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.408863555407152e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006370587507262826, "sensitivity": 0.5247276587992393 }, { "name": "model.layers.15.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8764253481058404e-05, "sensitivity": 0.8065787408252236 }, { "name": "model.layers.15.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.026267556080711e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006722203688696027, "sensitivity": 0.5203201471665125 }, { "name": "model.layers.15.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.932779095019214e-05, "sensitivity": 1.0668083518978788 }, { "name": "model.layers.15.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.539365813296172e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007011410198174417, "sensitivity": 0.5695020308030534 }, { "name": "model.layers.15.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8839719713432714e-05, "sensitivity": 0.7055598541044223 }, { "name": "model.layers.15.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.34205321148329e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006674338364973664, "sensitivity": 0.5631078052383575 }, { "name": "model.layers.15.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9319725551176816e-05, "sensitivity": 0.639544607400257 }, { "name": "model.layers.15.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.43709142877924e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006768115563318133, "sensitivity": 0.534157741924123 }, { "name": "model.layers.15.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006892151432111859, "sensitivity": 0.5942508892076761 }, { "name": "model.layers.15.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.678495765299886e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007084048120304942, "sensitivity": 0.5989733750231335 }, { "name": "model.layers.15.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.110197864472866e-05, "sensitivity": 0.6921747725382019 }, { "name": "model.layers.15.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.737528105484671e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.469769141403958e-05, "sensitivity": 0.602647106585502 }, { "name": "model.layers.15.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.861670069862157e-05, "sensitivity": 1.043134778401197 }, { "name": "model.layers.15.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.943351079120475e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.025646143825725e-05, "sensitivity": 0.6987595632930697 }, { "name": "model.layers.15.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007297468837350607, "sensitivity": 0.5233160240022272 }, { "name": "model.layers.15.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.268998842846486e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007600678945891559, "sensitivity": 0.5305339803931144 }, { "name": "model.layers.15.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.288022268563509e-05, "sensitivity": 0.8208959248151685 }, { "name": "model.layers.15.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.275188522726239e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007533053867518902, "sensitivity": 0.5982201714242442 }, { "name": "model.layers.15.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.874945054529235e-05, "sensitivity": 0.8431647132029618 }, { "name": "model.layers.15.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.83655798638938e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006629276904277503, "sensitivity": 0.5401363920314699 }, { "name": "model.layers.15.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.249347643461078e-05, "sensitivity": 0.8622206410447418 }, { "name": "model.layers.15.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.814325388404541e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007317927083931863, "sensitivity": 0.5590407574600169 }, { "name": "model.layers.15.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.926871017436497e-05, "sensitivity": 0.6689311863095654 }, { "name": "model.layers.15.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.633374027842365e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006637400947511196, "sensitivity": 0.5286108844087258 }, { "name": "model.layers.15.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.174673762870952e-05, "sensitivity": 0.6073003466206639 }, { "name": "model.layers.15.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.652938964180066e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007275479729287326, "sensitivity": 0.5544971107411215 }, { "name": "model.layers.15.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006651929579675198, "sensitivity": 0.5109869361719566 }, { "name": "model.layers.15.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.557578444699175e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006787145393900573, "sensitivity": 0.551704128326464 }, { "name": "model.layers.15.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.017522117763292e-05, "sensitivity": 1.3252179388578544 }, { "name": "model.layers.15.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.189831651681743e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006417500553652644, "sensitivity": 0.57655312726986 }, { "name": "model.layers.15.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.915821748203598e-05, "sensitivity": 0.809203465233935 }, { "name": "model.layers.15.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.093369163158059e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006627162802033126, "sensitivity": 0.537636664880039 }, { "name": "model.layers.15.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 5.068502105132211e-06, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.096842990795267e-06, "sensitivity": 2.0993028904456734 }, { "name": "model.layers.15.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.946851840439194e-07, "sensitivity": 10.0 }, { "name": "model.layers.15.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.624228389118798e-06, "sensitivity": 2.1060861603328584 }, { "name": "model.layers.15.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 2.8612088499357924e-05, "sensitivity": 1.3700640298838076 }, { "name": "model.layers.15.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00018407079915050417, "sensitivity": 0.9051123402210709 }, { "name": "model.layers.15.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.3551402844313998e-05, "sensitivity": 1.5183660563573949 }, { "name": "model.layers.15.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.501047053257935e-05, "sensitivity": 0.7320857509881563 }, { "name": "model.layers.15.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 2, "mse": 0.0032918842043727636, "sensitivity": 0.584650092642997 }, { "name": "model.layers.16.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.224007665878162e-05, "sensitivity": 0.7622516027190953 }, { "name": "model.layers.16.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.99677400461951e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007168391020968556, "sensitivity": 0.5248118613157358 }, { "name": "model.layers.16.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.051249637384899e-05, "sensitivity": 1.8241192307702867 }, { "name": "model.layers.16.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.164833052935137e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006576239829882979, "sensitivity": 0.5377808014534956 }, { "name": "model.layers.16.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.947776298853569e-05, "sensitivity": 1.072660481692607 }, { "name": "model.layers.16.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.032513510945137e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000680762343108654, "sensitivity": 0.5396033806421399 }, { "name": "model.layers.16.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.293645856203511e-05, "sensitivity": 1.0082123755705465 }, { "name": "model.layers.16.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.507331136162975e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.532444240292534e-05, "sensitivity": 0.6340592480211182 }, { "name": "model.layers.16.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7442863180767745e-05, "sensitivity": 0.6334673248840488 }, { "name": "model.layers.16.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.202473628036387e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006440478609874845, "sensitivity": 0.5107838089027863 }, { "name": "model.layers.16.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7089571782853454e-05, "sensitivity": 1.0556867626329776 }, { "name": "model.layers.16.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.137928494354128e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006477142451331019, "sensitivity": 0.5330219545914051 }, { "name": "model.layers.16.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0870207916013896e-05, "sensitivity": 1.7621189401581063 }, { "name": "model.layers.16.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.239447429834399e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.120756734162569e-05, "sensitivity": 0.6737119427416391 }, { "name": "model.layers.16.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0558631957974285e-05, "sensitivity": 0.7939732005783025 }, { "name": "model.layers.16.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.324566470539139e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006884997710585594, "sensitivity": 0.5588543475228145 }, { "name": "model.layers.16.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.381147250067443e-05, "sensitivity": 0.6220324405777625 }, { "name": "model.layers.16.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.922842885614955e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007228156318888068, "sensitivity": 0.5518675114024028 }, { "name": "model.layers.16.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9699486882891506e-05, "sensitivity": 0.6727988508507179 }, { "name": "model.layers.16.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.631183850913658e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006835697568021715, "sensitivity": 0.5131521128650551 }, { "name": "model.layers.16.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9316236729500815e-05, "sensitivity": 0.7460597962414103 }, { "name": "model.layers.16.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.25487189154228e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006735550705343485, "sensitivity": 0.5416022796092522 }, { "name": "model.layers.16.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1173951861565001e-05, "sensitivity": 1.7284898131136477 }, { "name": "model.layers.16.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.201310268101224e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006732711335644126, "sensitivity": 0.5582300274660316 }, { "name": "model.layers.16.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8580080803949386e-05, "sensitivity": 0.6136015476678722 }, { "name": "model.layers.16.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.314456868494744e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006676713819615543, "sensitivity": 0.5699443393051762 }, { "name": "model.layers.16.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0367940376454499e-05, "sensitivity": 1.6039350455898633 }, { "name": "model.layers.16.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.007592219248181e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006729345768690109, "sensitivity": 0.5601310176753704 }, { "name": "model.layers.16.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.173380825202912e-05, "sensitivity": 0.858333705560047 }, { "name": "model.layers.16.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.856692718632985e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006922126631252468, "sensitivity": 0.5409565586988434 }, { "name": "model.layers.16.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.026065238984302e-05, "sensitivity": 1.1452213011450105 }, { "name": "model.layers.16.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.940617135522189e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006945847999304533, "sensitivity": 0.562063339507686 }, { "name": "model.layers.16.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8704346884042025e-05, "sensitivity": 0.923586780676567 }, { "name": "model.layers.16.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.747977062739665e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006712715839967132, "sensitivity": 0.5812517232280876 }, { "name": "model.layers.16.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.755518941441551e-05, "sensitivity": 0.8033317836243861 }, { "name": "model.layers.16.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.553217986038362e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006370461778715253, "sensitivity": 0.5558259148968988 }, { "name": "model.layers.16.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.466080958489329e-05, "sensitivity": 0.6056524111878661 }, { "name": "model.layers.16.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.011951197455346e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007561428938060999, "sensitivity": 0.5286861239144487 }, { "name": "model.layers.16.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.020119326421991e-05, "sensitivity": 0.820036150750267 }, { "name": "model.layers.16.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.616886594201787e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006675976328551769, "sensitivity": 0.5637410897346853 }, { "name": "model.layers.16.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.606413469649851e-05, "sensitivity": 1.0206227700385815 }, { "name": "model.layers.16.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.257133691178751e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006100676255300641, "sensitivity": 0.5533873770644027 }, { "name": "model.layers.16.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.810125730931759e-05, "sensitivity": 0.7463528146936594 }, { "name": "model.layers.16.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.358858399835299e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006521352916024625, "sensitivity": 0.5029004422347407 }, { "name": "model.layers.16.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.744745067204349e-05, "sensitivity": 0.9352001394445356 }, { "name": "model.layers.16.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.2455649185722e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006613858859054744, "sensitivity": 0.5298392671548894 }, { "name": "model.layers.16.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0113650205312297e-05, "sensitivity": 1.5449250102156142 }, { "name": "model.layers.16.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.553285629706807e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006284556584432721, "sensitivity": 0.5135888500017207 }, { "name": "model.layers.16.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1078844181611203e-05, "sensitivity": 1.3667565224461504 }, { "name": "model.layers.16.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.398203140633996e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006851805374026299, "sensitivity": 0.5227850398796935 }, { "name": "model.layers.16.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.2076353616284905e-06, "sensitivity": 2.0972363005800454 }, { "name": "model.layers.16.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.479129979197751e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5939693993423134e-05, "sensitivity": 0.6324605288097305 }, { "name": "model.layers.16.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0669080438674428e-05, "sensitivity": 1.3293120152573434 }, { "name": "model.layers.16.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.307152489171131e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006704523111693561, "sensitivity": 0.5361192619787151 }, { "name": "model.layers.16.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8492543757893145e-05, "sensitivity": 0.9211756706834802 }, { "name": "model.layers.16.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.983250730423606e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006758067756891251, "sensitivity": 0.5063142945484759 }, { "name": "model.layers.16.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0047905561805237e-05, "sensitivity": 1.5393984048174307 }, { "name": "model.layers.16.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.586315516367904e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.541136488318443e-05, "sensitivity": 0.8025940347922969 }, { "name": "model.layers.16.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9697613323805854e-05, "sensitivity": 0.7363442024025337 }, { "name": "model.layers.16.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.463551471824758e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006952823023311794, "sensitivity": 0.5672486211418577 }, { "name": "model.layers.16.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.38408018858172e-05, "sensitivity": 0.6606060479067855 }, { "name": "model.layers.16.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.18600972504646e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007339600706472993, "sensitivity": 0.5559623614159559 }, { "name": "model.layers.16.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.814270116388798e-05, "sensitivity": 0.6805270400195826 }, { "name": "model.layers.16.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.475040663644904e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006427834159694612, "sensitivity": 0.5484675777670553 }, { "name": "model.layers.16.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.84356821491383e-05, "sensitivity": 0.6145359931167024 }, { "name": "model.layers.16.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.211458523670444e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006382351275533438, "sensitivity": 0.5370975642277902 }, { "name": "model.layers.16.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.940280971117318e-05, "sensitivity": 0.7462425145519284 }, { "name": "model.layers.16.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.605328053410631e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006665957043878734, "sensitivity": 0.5283042243086359 }, { "name": "model.layers.16.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.752585275331512e-05, "sensitivity": 0.7379784692332823 }, { "name": "model.layers.16.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.310942808340769e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006447491468861699, "sensitivity": 0.5550016903948796 }, { "name": "model.layers.16.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.645742567139678e-05, "sensitivity": 1.172285555627954 }, { "name": "model.layers.16.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.88688749303401e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7911762269213796e-05, "sensitivity": 0.6309909780526053 }, { "name": "model.layers.16.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.300717359408736e-05, "sensitivity": 0.8664109912423372 }, { "name": "model.layers.16.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.887637482577702e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007167315925471485, "sensitivity": 0.5505814863130034 }, { "name": "model.layers.16.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9461279306560755e-05, "sensitivity": 0.8615633044385057 }, { "name": "model.layers.16.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.572195386273961e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006708133732900023, "sensitivity": 0.5144160595317004 }, { "name": "model.layers.16.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1186213669134304e-05, "sensitivity": 1.3380817644223888 }, { "name": "model.layers.16.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.396262731163006e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.253429455682635e-05, "sensitivity": 0.6534634755127516 }, { "name": "model.layers.16.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.16069883108139e-05, "sensitivity": 0.740252352819635 }, { "name": "model.layers.16.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.485831249847251e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000720726209692657, "sensitivity": 0.5380575499851006 }, { "name": "model.layers.16.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.470935477409512e-05, "sensitivity": 0.6533798209359893 }, { "name": "model.layers.16.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.829277481301688e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007430700352415442, "sensitivity": 0.5148189559091219 }, { "name": "model.layers.16.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.958662222838029e-05, "sensitivity": 1.0275289255908038 }, { "name": "model.layers.16.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.302530550783558e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006989281973801553, "sensitivity": 0.5293197836080618 }, { "name": "model.layers.16.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.243934330996126e-05, "sensitivity": 0.8929478861105288 }, { "name": "model.layers.16.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.634471674260567e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007526380941271782, "sensitivity": 0.5967748440939219 }, { "name": "model.layers.16.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.233464955585077e-05, "sensitivity": 0.8087718861007984 }, { "name": "model.layers.16.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.27963901883777e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007232515490613878, "sensitivity": 0.5286389244954715 }, { "name": "model.layers.16.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006920963060110807, "sensitivity": 0.5512342099738426 }, { "name": "model.layers.16.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.507995635729458e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.34663738310337e-05, "sensitivity": 0.6064900909221628 }, { "name": "model.layers.16.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.940424671280198e-05, "sensitivity": 0.9071120025872312 }, { "name": "model.layers.16.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.515417112495925e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006915563717484474, "sensitivity": 0.5518233297597829 }, { "name": "model.layers.16.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006993203423917294, "sensitivity": 0.543731819991625 }, { "name": "model.layers.16.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.624755997108878e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007003572536632419, "sensitivity": 0.5216498852022691 }, { "name": "model.layers.16.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.893694469705224e-05, "sensitivity": 1.163535719994436 }, { "name": "model.layers.16.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.983559839885856e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006353619392029941, "sensitivity": 0.5363005239013103 }, { "name": "model.layers.16.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.980298010399565e-05, "sensitivity": 0.6862804858627635 }, { "name": "model.layers.16.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.854658067823038e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006889039068482816, "sensitivity": 0.5494394972806245 }, { "name": "model.layers.16.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.916407098993659e-05, "sensitivity": 0.86314044657983 }, { "name": "model.layers.16.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.821698548264976e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006539043388329446, "sensitivity": 0.5379688237251222 }, { "name": "model.layers.16.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0370730706199538e-05, "sensitivity": 1.2308131489237273 }, { "name": "model.layers.16.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.241212642838946e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006290421588346362, "sensitivity": 0.5582040820541858 }, { "name": "model.layers.16.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.180873606353998e-05, "sensitivity": 0.6038814559336257 }, { "name": "model.layers.16.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.1667221845928e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007383663905784488, "sensitivity": 0.5364714927832408 }, { "name": "model.layers.16.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.622814205707982e-05, "sensitivity": 0.7941584887227643 }, { "name": "model.layers.16.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.910745469212998e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006423332961276174, "sensitivity": 0.5263160228557003 }, { "name": "model.layers.16.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.965585296507925e-05, "sensitivity": 1.0211933124618053 }, { "name": "model.layers.16.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.19108675437019e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000695787079166621, "sensitivity": 0.5304205640076206 }, { "name": "model.layers.16.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.85659799980931e-05, "sensitivity": 0.8198009253999988 }, { "name": "model.layers.16.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.803263315508957e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006479301955550909, "sensitivity": 0.5669179715038588 }, { "name": "model.layers.16.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.010620326269418e-05, "sensitivity": 1.284011090424262 }, { "name": "model.layers.16.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.59567831462482e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006377120735123754, "sensitivity": 0.573647598485387 }, { "name": "model.layers.16.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0660477528290357e-05, "sensitivity": 1.3599113478203024 }, { "name": "model.layers.16.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.004345323162852e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.017376290401444e-05, "sensitivity": 0.6059890860384428 }, { "name": "model.layers.16.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0238740843487903e-05, "sensitivity": 0.6204496658100933 }, { "name": "model.layers.16.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.369016318785725e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006777895032428205, "sensitivity": 0.5014591099880235 }, { "name": "model.layers.16.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.2407461983675603e-06, "sensitivity": 2.096873391205192 }, { "name": "model.layers.16.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.220504928933224e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006529337260872126, "sensitivity": 0.5163212813682768 }, { "name": "model.layers.16.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3890338525234256e-06, "sensitivity": 2.097715419328279 }, { "name": "model.layers.16.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.730141528052627e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.0213533641945105e-05, "sensitivity": 1.52005590177854 }, { "name": "model.layers.16.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0216695045528468e-05, "sensitivity": 1.5350672538108254 }, { "name": "model.layers.16.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.185695724525431e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006312135374173522, "sensitivity": 0.53095998603451 }, { "name": "model.layers.16.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.834804586716928e-06, "sensitivity": 1.5334269603074893 }, { "name": "model.layers.16.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.244143264666491e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006616059690713882, "sensitivity": 0.5689208304008302 }, { "name": "model.layers.16.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0624817150528543e-05, "sensitivity": 1.4982229481795808 }, { "name": "model.layers.16.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.692062465343042e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9069057897431776e-05, "sensitivity": 0.6119276156103577 }, { "name": "model.layers.16.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.164208753034472e-05, "sensitivity": 0.8475410257202107 }, { "name": "model.layers.16.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.746303142790566e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006919795414432883, "sensitivity": 0.5205755812746475 }, { "name": "model.layers.16.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 4.747220373246819e-06, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.442612185404869e-06, "sensitivity": 2.1001073616711112 }, { "name": "model.layers.16.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.374741019499197e-07, "sensitivity": 10.0 }, { "name": "model.layers.16.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 7.257636298163561e-06, "sensitivity": 1.6828009108730246 }, { "name": "model.layers.16.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 2.71807311946759e-05, "sensitivity": 1.797561079238254 }, { "name": "model.layers.16.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00018194885342381895, "sensitivity": 1.1874689527676952 }, { "name": "model.layers.16.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.416656141373096e-05, "sensitivity": 1.8298546480569817 }, { "name": "model.layers.16.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0006541988113895059, "sensitivity": 0.5777880551599879 }, { "name": "model.layers.16.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002798729983624071, "sensitivity": 0.790146251878931 }, { "name": "model.layers.17.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.461681212182157e-05, "sensitivity": 1.151454438043213 }, { "name": "model.layers.17.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.915574992191978e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.100803537061438e-05, "sensitivity": 0.6356711407159794 }, { "name": "model.layers.17.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.763858644058928e-05, "sensitivity": 1.174517656863229 }, { "name": "model.layers.17.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.190096423277282e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006631982396356761, "sensitivity": 0.5995058068510188 }, { "name": "model.layers.17.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.942638381384313e-05, "sensitivity": 0.7830205244900724 }, { "name": "model.layers.17.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.34068499039131e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000649512221571058, "sensitivity": 0.5408508486887205 }, { "name": "model.layers.17.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.694153050077148e-06, "sensitivity": 1.5983556206892835 }, { "name": "model.layers.17.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.686628128387383e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006020100554451346, "sensitivity": 0.5458063913954572 }, { "name": "model.layers.17.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7007760915439576e-05, "sensitivity": 0.7337705164741607 }, { "name": "model.layers.17.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.524095397253404e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006283242255449295, "sensitivity": 0.5857165805012349 }, { "name": "model.layers.17.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0138053767150268e-05, "sensitivity": 1.9167523058124152 }, { "name": "model.layers.17.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.02690931827965e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006396063836291432, "sensitivity": 0.5439536042420762 }, { "name": "model.layers.17.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.695772051694803e-05, "sensitivity": 0.9432880318128534 }, { "name": "model.layers.17.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.699951882183086e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006466718623414636, "sensitivity": 0.5168436062189641 }, { "name": "model.layers.17.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.427567859645933e-05, "sensitivity": 0.6621922535336049 }, { "name": "model.layers.17.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.201458060990262e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007266198517754674, "sensitivity": 0.5931764717354802 }, { "name": "model.layers.17.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000658202450722456, "sensitivity": 0.5742352138749492 }, { "name": "model.layers.17.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.731917778779462e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006595224840566516, "sensitivity": 0.5249970578192116 }, { "name": "model.layers.17.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.664453419740312e-05, "sensitivity": 0.7764982184144552 }, { "name": "model.layers.17.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.434507776655664e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006113043637014925, "sensitivity": 0.5226617186738426 }, { "name": "model.layers.17.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.879476884729229e-05, "sensitivity": 0.6170873723547927 }, { "name": "model.layers.17.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.265488536882913e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006203338271006942, "sensitivity": 0.5675976918542521 }, { "name": "model.layers.17.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9159850934520364e-05, "sensitivity": 1.026000970023668 }, { "name": "model.layers.17.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.800379873719066e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006389596965163946, "sensitivity": 0.5482815266911795 }, { "name": "model.layers.17.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.08663831371814e-05, "sensitivity": 0.6288514674864552 }, { "name": "model.layers.17.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.346105803662795e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006402774015441537, "sensitivity": 0.5306204714186682 }, { "name": "model.layers.17.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.67998577025719e-05, "sensitivity": 0.8081746682443737 }, { "name": "model.layers.17.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.009775006532436e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006519716698676348, "sensitivity": 0.5540296055686726 }, { "name": "model.layers.17.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006623428780585527, "sensitivity": 0.5547119502242439 }, { "name": "model.layers.17.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.736190354989958e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006428458727896214, "sensitivity": 0.5615429345929436 }, { "name": "model.layers.17.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.774344754172489e-05, "sensitivity": 0.7919193025022436 }, { "name": "model.layers.17.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.553038360834762e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006519687594845891, "sensitivity": 0.5037889168940924 }, { "name": "model.layers.17.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006582130445167422, "sensitivity": 0.5884579386422247 }, { "name": "model.layers.17.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.47045226287446e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006305359420366585, "sensitivity": 0.5544184120270401 }, { "name": "model.layers.17.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.441049481509253e-05, "sensitivity": 0.6376701063898348 }, { "name": "model.layers.17.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.233214430219959e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007164077833294868, "sensitivity": 0.5338096264520903 }, { "name": "model.layers.17.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.715937732020393e-05, "sensitivity": 0.9172693707739412 }, { "name": "model.layers.17.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.651352689208579e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005984754534438252, "sensitivity": 0.5336748171908345 }, { "name": "model.layers.17.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0892067621171009e-05, "sensitivity": 1.6817516014502076 }, { "name": "model.layers.17.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.447984901569725e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006777711096219718, "sensitivity": 0.5436274778331136 }, { "name": "model.layers.17.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.710002369596623e-05, "sensitivity": 0.7194716015062326 }, { "name": "model.layers.17.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.93953586758289e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.636378045892343e-05, "sensitivity": 0.6153335924527803 }, { "name": "model.layers.17.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.00907915213611e-05, "sensitivity": 0.620853623199941 }, { "name": "model.layers.17.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.194048864927026e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006885076873004436, "sensitivity": 0.533382873994215 }, { "name": "model.layers.17.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006961270119063556, "sensitivity": 0.5666537562609729 }, { "name": "model.layers.17.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.40997086520656e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007009388646110892, "sensitivity": 0.5703549361073157 }, { "name": "model.layers.17.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3439213236997603e-06, "sensitivity": 2.0976021677471124 }, { "name": "model.layers.17.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.894067953704507e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 9.732872058521025e-06, "sensitivity": 1.562903490334871 }, { "name": "model.layers.17.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.834762123413384e-05, "sensitivity": 0.9080809477354591 }, { "name": "model.layers.17.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.291977570072049e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.672841507475823e-05, "sensitivity": 0.7877390239504237 }, { "name": "model.layers.17.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.102569750510156e-05, "sensitivity": 0.6210772502689668 }, { "name": "model.layers.17.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.181667681128602e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006843460141681135, "sensitivity": 0.5509152805875681 }, { "name": "model.layers.17.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.276821659412235e-05, "sensitivity": 0.6587780713946526 }, { "name": "model.layers.17.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.800914889026899e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007179062813520432, "sensitivity": 0.5862407605159811 }, { "name": "model.layers.17.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006611388525925577, "sensitivity": 0.5252051398160225 }, { "name": "model.layers.17.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.713815992043237e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006474414258264005, "sensitivity": 0.5050988182100243 }, { "name": "model.layers.17.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.058056897018105e-05, "sensitivity": 1.177174087162951 }, { "name": "model.layers.17.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.875524150018464e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000650999543722719, "sensitivity": 0.5251301468706358 }, { "name": "model.layers.17.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0530514373385813e-05, "sensitivity": 1.5842469916583917 }, { "name": "model.layers.17.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.811603831622051e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7315977755934e-05, "sensitivity": 0.7436154565957124 }, { "name": "model.layers.17.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.847142165293917e-05, "sensitivity": 1.101884860574121 }, { "name": "model.layers.17.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.474450735069695e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006436347030103207, "sensitivity": 0.5322176757689444 }, { "name": "model.layers.17.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.93807635596022e-05, "sensitivity": 1.0370299242741041 }, { "name": "model.layers.17.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.254906566027785e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006772837368771434, "sensitivity": 0.5677893643499271 }, { "name": "model.layers.17.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.16779361735098e-05, "sensitivity": 0.9486640080449331 }, { "name": "model.layers.17.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.372735808530706e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.165822560433298e-05, "sensitivity": 1.0037833137942231 }, { "name": "model.layers.17.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.760196290793829e-05, "sensitivity": 0.7893227499325983 }, { "name": "model.layers.17.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.011619007040281e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006356735830195248, "sensitivity": 0.5258507519853087 }, { "name": "model.layers.17.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.834869443788193e-05, "sensitivity": 0.6837414910689024 }, { "name": "model.layers.17.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.291817271630862e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006791178020648658, "sensitivity": 0.5059063290458099 }, { "name": "model.layers.17.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0678835678845644e-05, "sensitivity": 1.8767796553629852 }, { "name": "model.layers.17.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.930635774755501e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.945742304902524e-05, "sensitivity": 0.7072075246606853 }, { "name": "model.layers.17.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.784354289062321e-05, "sensitivity": 0.8751870099338668 }, { "name": "model.layers.17.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.504887437586149e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006269905716180801, "sensitivity": 0.5295267307291349 }, { "name": "model.layers.17.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.142198981251568e-05, "sensitivity": 0.7658130700756512 }, { "name": "model.layers.17.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.061089490889572e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006967309745959938, "sensitivity": 0.5733702117559542 }, { "name": "model.layers.17.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.649836384691298e-05, "sensitivity": 0.645518020930572 }, { "name": "model.layers.17.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.31742318293982e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006117822485975921, "sensitivity": 0.5343230827658222 }, { "name": "model.layers.17.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8883637393591926e-05, "sensitivity": 0.7705049663845809 }, { "name": "model.layers.17.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.639845651079668e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006290716701187193, "sensitivity": 0.5574654041865902 }, { "name": "model.layers.17.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.342941196635365e-05, "sensitivity": 0.639438644382427 }, { "name": "model.layers.17.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.797791792858334e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006952762487344444, "sensitivity": 0.5359232275104066 }, { "name": "model.layers.17.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.054902041796595e-05, "sensitivity": 1.0202000668575857 }, { "name": "model.layers.17.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.129860364329943e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006589122349396348, "sensitivity": 0.5478949994605301 }, { "name": "model.layers.17.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000627960660494864, "sensitivity": 0.5781699387128405 }, { "name": "model.layers.17.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.897440473745519e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006212025764398277, "sensitivity": 0.541987038918099 }, { "name": "model.layers.17.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.67412753298413e-05, "sensitivity": 0.9378394397055718 }, { "name": "model.layers.17.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.182655170050566e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006428157212212682, "sensitivity": 0.5573615511785233 }, { "name": "model.layers.17.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6108878197846934e-05, "sensitivity": 0.7681429854688511 }, { "name": "model.layers.17.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.215909706952516e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006190197309479117, "sensitivity": 0.5421675364844715 }, { "name": "model.layers.17.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006322422996163368, "sensitivity": 0.5825416481090596 }, { "name": "model.layers.17.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.144218443499994e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000608837406616658, "sensitivity": 0.5627624371573587 }, { "name": "model.layers.17.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.821273953188211e-05, "sensitivity": 0.7563552375785675 }, { "name": "model.layers.17.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.227694022229116e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006587868556380272, "sensitivity": 0.5321168255039567 }, { "name": "model.layers.17.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.549153476953506e-05, "sensitivity": 0.6747816374028743 }, { "name": "model.layers.17.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.498210834455676e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.658980419160798e-05, "sensitivity": 0.6252292672736375 }, { "name": "model.layers.17.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.245174881769344e-05, "sensitivity": 0.6949560853123437 }, { "name": "model.layers.17.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.27837345948501e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006979770842008293, "sensitivity": 0.5594577157493668 }, { "name": "model.layers.17.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.071096140658483e-05, "sensitivity": 0.7457553190864783 }, { "name": "model.layers.17.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.893008048791671e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006663856329396367, "sensitivity": 0.545709366578931 }, { "name": "model.layers.17.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.301885878201574e-05, "sensitivity": 0.923478507635145 }, { "name": "model.layers.17.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.490065172532923e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007025778177194297, "sensitivity": 0.5621249183523455 }, { "name": "model.layers.17.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.129941175458953e-05, "sensitivity": 0.8983354546263549 }, { "name": "model.layers.17.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.473069333878811e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006853108061477542, "sensitivity": 0.5334267560694557 }, { "name": "model.layers.17.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.019386273692362e-05, "sensitivity": 0.710014859306038 }, { "name": "model.layers.17.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.708743853778287e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006713730981573462, "sensitivity": 0.5702314604031804 }, { "name": "model.layers.17.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0048500017728657e-05, "sensitivity": 0.925235090208558 }, { "name": "model.layers.17.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.170561613951577e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006477349670603871, "sensitivity": 0.5489651717916565 }, { "name": "model.layers.17.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0826550907222554e-05, "sensitivity": 1.1169045384933298 }, { "name": "model.layers.17.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.425049718927767e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006834546802565455, "sensitivity": 0.5195055495730968 }, { "name": "model.layers.17.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9187004808336496e-05, "sensitivity": 0.6806627344155791 }, { "name": "model.layers.17.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.8405438469199e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.882571713300422e-05, "sensitivity": 0.6556232375451173 }, { "name": "model.layers.17.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0958703569485806e-05, "sensitivity": 1.9618750655922863 }, { "name": "model.layers.17.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.005975817264698e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.017718624207191e-05, "sensitivity": 0.6963224927881758 }, { "name": "model.layers.17.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0493822628632188e-05, "sensitivity": 1.3500542214175666 }, { "name": "model.layers.17.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.978637886983051e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006500994204543531, "sensitivity": 0.5165258784337132 }, { "name": "model.layers.17.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0245995326840784e-05, "sensitivity": 1.3864155420644437 }, { "name": "model.layers.17.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.195719374270993e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006033016834408045, "sensitivity": 0.5876128691364909 }, { "name": "model.layers.17.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.776685429736972e-05, "sensitivity": 0.7260174543741545 }, { "name": "model.layers.17.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.955030471544887e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006350442999973893, "sensitivity": 0.5302609053864664 }, { "name": "model.layers.17.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006481326417997479, "sensitivity": 0.5699507435652847 }, { "name": "model.layers.17.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.010718263700255e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006273322505876422, "sensitivity": 0.5284880173368678 }, { "name": "model.layers.17.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.475819751969539e-06, "sensitivity": 1.4701865436142239 }, { "name": "model.layers.17.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.059678637233446e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005914315115660429, "sensitivity": 0.5495195233348713 }, { "name": "model.layers.17.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0014749932452105e-05, "sensitivity": 1.2056754242335344 }, { "name": "model.layers.17.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.880374030515668e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005961160641163588, "sensitivity": 0.5604861225924612 }, { "name": "model.layers.17.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.247349665500224e-05, "sensitivity": 0.6988311843576372 }, { "name": "model.layers.17.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.048560064504272e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006946692592464387, "sensitivity": 0.5204266215296154 }, { "name": "model.layers.17.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 4.2312321966164745e-06, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.283136382175144e-06, "sensitivity": 2.0994290748661903 }, { "name": "model.layers.17.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.502608241338748e-07, "sensitivity": 10.0 }, { "name": "model.layers.17.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.6655742456350708e-06, "sensitivity": 2.104987972588769 }, { "name": "model.layers.17.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 7.748869393253699e-06, "sensitivity": 2.1908353113184993 }, { "name": "model.layers.17.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00018019579874817282, "sensitivity": 0.9132328670365855 }, { "name": "model.layers.17.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.564079684612807e-05, "sensitivity": 1.0788967496537367 }, { "name": "model.layers.17.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.937926107435487e-05, "sensitivity": 0.657307615601148 }, { "name": "model.layers.17.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002681644109543413, "sensitivity": 0.6941153772929682 }, { "name": "model.layers.18.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3768755606142804e-05, "sensitivity": 1.0683910817319835 }, { "name": "model.layers.18.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.720752369597903e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006155906594358385, "sensitivity": 0.5214875862910846 }, { "name": "model.layers.18.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.718937609344721e-05, "sensitivity": 0.8210119567374976 }, { "name": "model.layers.18.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.745857490386697e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006240094662643969, "sensitivity": 0.5435873161001123 }, { "name": "model.layers.18.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.224722892511636e-05, "sensitivity": 0.7623165971387024 }, { "name": "model.layers.18.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.156503443184192e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007105501717887819, "sensitivity": 0.5466298288242215 }, { "name": "model.layers.18.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0061551620310638e-05, "sensitivity": 1.9632300221385734 }, { "name": "model.layers.18.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.652941013067903e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006156706949695945, "sensitivity": 0.5590213418084131 }, { "name": "model.layers.18.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006565309013240039, "sensitivity": 0.5813253206507992 }, { "name": "model.layers.18.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.725742309754423e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006417898694053292, "sensitivity": 0.5401969281153957 }, { "name": "model.layers.18.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.323415436781943e-05, "sensitivity": 0.9330909836704775 }, { "name": "model.layers.18.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.677225314888346e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007071642903611064, "sensitivity": 0.5581833857689203 }, { "name": "model.layers.18.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.699681059923023e-05, "sensitivity": 1.1443021569897265 }, { "name": "model.layers.18.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.25515781393915e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006487325299531221, "sensitivity": 0.5840361352056971 }, { "name": "model.layers.18.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7568664487916976e-05, "sensitivity": 0.9337006493647872 }, { "name": "model.layers.18.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.178601665851602e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006650621071457863, "sensitivity": 0.5563182549170671 }, { "name": "model.layers.18.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006934432312846184, "sensitivity": 0.5389218499158244 }, { "name": "model.layers.18.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.231537099665729e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000681681209243834, "sensitivity": 0.5698356111088878 }, { "name": "model.layers.18.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.191273779317271e-06, "sensitivity": 2.0971314217160186 }, { "name": "model.layers.18.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.8265524078015e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.369901919038966e-05, "sensitivity": 0.8816863841051026 }, { "name": "model.layers.18.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.147066596895456e-05, "sensitivity": 0.622258677484572 }, { "name": "model.layers.18.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.287692713158322e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006758943200111389, "sensitivity": 0.5466854950093959 }, { "name": "model.layers.18.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.696806329069659e-05, "sensitivity": 0.6067905940874736 }, { "name": "model.layers.18.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.368100452571525e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006174708832986653, "sensitivity": 0.5780204098313948 }, { "name": "model.layers.18.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.838385550305247e-05, "sensitivity": 0.6939487178140951 }, { "name": "model.layers.18.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.381583711525309e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006472686072811484, "sensitivity": 0.5255976296168394 }, { "name": "model.layers.18.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.645816418109462e-05, "sensitivity": 0.88480288706704 }, { "name": "model.layers.18.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.5531036120301e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006242530071176589, "sensitivity": 0.5361110409328683 }, { "name": "model.layers.18.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006980095058679581, "sensitivity": 0.5251848879563237 }, { "name": "model.layers.18.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.535058443863818e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000700572389177978, "sensitivity": 0.5626738967886133 }, { "name": "model.layers.18.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1446299140516203e-05, "sensitivity": 1.363656486968438 }, { "name": "model.layers.18.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.483998842872097e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.117915780923795e-05, "sensitivity": 1.4365983999059246 }, { "name": "model.layers.18.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9938058257102966e-05, "sensitivity": 0.7584460134545417 }, { "name": "model.layers.18.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.218741527343809e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006461074808612466, "sensitivity": 0.5545205321885806 }, { "name": "model.layers.18.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.768123082816601e-05, "sensitivity": 0.7120516206771208 }, { "name": "model.layers.18.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.957709158290527e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006421735743060708, "sensitivity": 0.5526392376418194 }, { "name": "model.layers.18.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007191387703642249, "sensitivity": 0.5527646894422348 }, { "name": "model.layers.18.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.733192433079239e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007219755789265037, "sensitivity": 0.5350909189817061 }, { "name": "model.layers.18.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.093248521210626e-05, "sensitivity": 0.7774306028741368 }, { "name": "model.layers.18.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.535520924444427e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006799651309847832, "sensitivity": 0.545475869232167 }, { "name": "model.layers.18.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.816043267259374e-05, "sensitivity": 1.1710794510465827 }, { "name": "model.layers.18.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.433490054609138e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006353770149871707, "sensitivity": 0.5431730878568697 }, { "name": "model.layers.18.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0106734407600015e-05, "sensitivity": 1.6832395978520736 }, { "name": "model.layers.18.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.611265798208478e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.489853720064275e-05, "sensitivity": 0.9629650798706694 }, { "name": "model.layers.18.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006627370603382587, "sensitivity": 0.5768224645609046 }, { "name": "model.layers.18.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.270374797168188e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006388802430592477, "sensitivity": 0.5486702356002139 }, { "name": "model.layers.18.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.68132491025608e-05, "sensitivity": 0.6102596762798426 }, { "name": "model.layers.18.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.751148925512098e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006150329136289656, "sensitivity": 0.5135808253744026 }, { "name": "model.layers.18.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.125067011453211e-05, "sensitivity": 1.0584423972168922 }, { "name": "model.layers.18.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.17971988201316e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006934773991815746, "sensitivity": 0.5352620268877318 }, { "name": "model.layers.18.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.424254388548434e-05, "sensitivity": 0.7771946257072306 }, { "name": "model.layers.18.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.239402179948229e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007157858344726264, "sensitivity": 0.5463998723360118 }, { "name": "model.layers.18.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.234878674149513e-05, "sensitivity": 0.9960398248431956 }, { "name": "model.layers.18.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.754192665743176e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.146671512397006e-05, "sensitivity": 0.6016391237800286 }, { "name": "model.layers.18.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.030965596437454e-05, "sensitivity": 0.9749665585819647 }, { "name": "model.layers.18.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.50480865008285e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006809992482885718, "sensitivity": 0.537252745106604 }, { "name": "model.layers.18.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0353046137606725e-05, "sensitivity": 1.135109142448228 }, { "name": "model.layers.18.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.852235626160109e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006965158390812576, "sensitivity": 0.5591972827921904 }, { "name": "model.layers.18.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0989504517056048e-05, "sensitivity": 1.2584627837293307 }, { "name": "model.layers.18.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.290878324463847e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006513729458674788, "sensitivity": 0.5447699725165202 }, { "name": "model.layers.18.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.773509474238381e-05, "sensitivity": 1.0510728013324637 }, { "name": "model.layers.18.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.106434847832134e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006292964098975062, "sensitivity": 0.5731517845213719 }, { "name": "model.layers.18.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.718658212572336e-05, "sensitivity": 0.8609747065272525 }, { "name": "model.layers.18.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.406209761029459e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006257520872168243, "sensitivity": 0.5862614305788391 }, { "name": "model.layers.18.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.828587381984107e-05, "sensitivity": 0.9519449352946373 }, { "name": "model.layers.18.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.572740858246107e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00065939238993451, "sensitivity": 0.5158423532486368 }, { "name": "model.layers.18.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.609971049125306e-05, "sensitivity": 0.8167990984267717 }, { "name": "model.layers.18.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.20007414858992e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.509125185199082e-05, "sensitivity": 0.7376413067146534 }, { "name": "model.layers.18.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.940775736235082e-05, "sensitivity": 0.8513860615820007 }, { "name": "model.layers.18.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.860672551236348e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006573688006028533, "sensitivity": 0.5500838737252949 }, { "name": "model.layers.18.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.711413541575894e-05, "sensitivity": 0.6928415657598016 }, { "name": "model.layers.18.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.577610633939912e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006261933594942093, "sensitivity": 0.5304496897894063 }, { "name": "model.layers.18.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9911013522651047e-05, "sensitivity": 0.9685396768412287 }, { "name": "model.layers.18.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.591014312107291e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.054558252799325e-05, "sensitivity": 0.7148080689063118 }, { "name": "model.layers.18.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.290683010476641e-06, "sensitivity": 1.4577627528632568 }, { "name": "model.layers.18.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.395439757194254e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005845701089128852, "sensitivity": 0.5648250793369446 }, { "name": "model.layers.18.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.043287430657074e-05, "sensitivity": 0.6412887838143002 }, { "name": "model.layers.18.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.660185363216442e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006697532953694463, "sensitivity": 0.5635214183676419 }, { "name": "model.layers.18.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.571487756446004e-05, "sensitivity": 0.7445277258687123 }, { "name": "model.layers.18.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.585402161363163e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007525449618697166, "sensitivity": 0.5265433985258016 }, { "name": "model.layers.18.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.909112223889679e-05, "sensitivity": 0.7901876704240491 }, { "name": "model.layers.18.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.169098239501182e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006509320810437202, "sensitivity": 0.5543123333190413 }, { "name": "model.layers.18.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.894695641472936e-05, "sensitivity": 0.96917918038664 }, { "name": "model.layers.18.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.588190331058286e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006539045716635883, "sensitivity": 0.5825980260566714 }, { "name": "model.layers.18.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0869334801100194e-05, "sensitivity": 1.2393846095289944 }, { "name": "model.layers.18.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.01183887233492e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8889530919259414e-05, "sensitivity": 0.6121964562604877 }, { "name": "model.layers.18.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.468895298894495e-05, "sensitivity": 0.6128540419506227 }, { "name": "model.layers.18.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.528240075771464e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.478426803369075e-05, "sensitivity": 0.6048557244950232 }, { "name": "model.layers.18.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8650370192481205e-05, "sensitivity": 0.6247889750291721 }, { "name": "model.layers.18.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.643853680543543e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006457070121541619, "sensitivity": 0.5417162388419479 }, { "name": "model.layers.18.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6873905123211443e-05, "sensitivity": 0.6064556502180046 }, { "name": "model.layers.18.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.506510198458272e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006157317548058927, "sensitivity": 0.540864845723175 }, { "name": "model.layers.18.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1194555554538965e-05, "sensitivity": 1.4448165309156729 }, { "name": "model.layers.18.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.862867844072753e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.16025718045421e-05, "sensitivity": 0.6007817280836287 }, { "name": "model.layers.18.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0741776350187138e-05, "sensitivity": 1.31863642277804 }, { "name": "model.layers.18.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.825353011663537e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.077845081454143e-05, "sensitivity": 1.3873834400804583 }, { "name": "model.layers.18.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.586366751231253e-05, "sensitivity": 1.0963588271794014 }, { "name": "model.layers.18.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.272034056564735e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006295155035331845, "sensitivity": 0.5594815997505217 }, { "name": "model.layers.18.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.197067811328452e-06, "sensitivity": 1.992892443254145 }, { "name": "model.layers.18.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.621894842988695e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.028600571677089e-05, "sensitivity": 0.6490427340392377 }, { "name": "model.layers.18.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006872533122077584, "sensitivity": 0.5491348209456268 }, { "name": "model.layers.18.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.136735919426428e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006915683625265956, "sensitivity": 0.5199439361852398 }, { "name": "model.layers.18.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0277489309373777e-05, "sensitivity": 1.8889414671389742 }, { "name": "model.layers.18.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.731064440326008e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.530676571652293e-05, "sensitivity": 0.727865579312458 }, { "name": "model.layers.18.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.344218854792416e-05, "sensitivity": 0.9913448328897938 }, { "name": "model.layers.18.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.570662662852556e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007164551643654704, "sensitivity": 0.5579995212603616 }, { "name": "model.layers.18.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0033345461124554e-05, "sensitivity": 1.3454417738520528 }, { "name": "model.layers.18.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.598412258223107e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006325780414044857, "sensitivity": 0.572077799423882 }, { "name": "model.layers.18.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006393682560883462, "sensitivity": 0.5628403439788878 }, { "name": "model.layers.18.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0273363386659184e-06, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006133638671599329, "sensitivity": 0.5262693254632584 }, { "name": "model.layers.18.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.090050136554055e-05, "sensitivity": 1.4282971426629516 }, { "name": "model.layers.18.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.286257641681004e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0455869970610365e-05, "sensitivity": 0.76831631769947 }, { "name": "model.layers.18.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.041878805262968e-05, "sensitivity": 0.7840448570198159 }, { "name": "model.layers.18.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.915379344718531e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006594274891540408, "sensitivity": 0.5622263718441824 }, { "name": "model.layers.18.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.720616536564194e-05, "sensitivity": 0.8860686427366288 }, { "name": "model.layers.18.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.56255451758625e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006297365762293339, "sensitivity": 0.5238387137732312 }, { "name": "model.layers.18.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.972495273454115e-05, "sensitivity": 0.6619986584914582 }, { "name": "model.layers.18.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.812341553086299e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006689619622193277, "sensitivity": 0.5740431880616034 }, { "name": "model.layers.18.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.004161822493188e-05, "sensitivity": 1.6872062508261338 }, { "name": "model.layers.18.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0078637160404469e-06, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5902964959386736e-05, "sensitivity": 0.8143149044527186 }, { "name": "model.layers.18.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8473480748943985e-05, "sensitivity": 0.8741074547308023 }, { "name": "model.layers.18.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.632043323406833e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006402199505828321, "sensitivity": 0.5236312940989641 }, { "name": "model.layers.18.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000685560517013073, "sensitivity": 0.5448568300953934 }, { "name": "model.layers.18.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.878816520838882e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006672485615126789, "sensitivity": 0.5609565789796327 }, { "name": "model.layers.18.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.734939986723475e-05, "sensitivity": 1.1768944530365477 }, { "name": "model.layers.18.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.826556955275009e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.797428821097128e-05, "sensitivity": 0.9542206857208423 }, { "name": "model.layers.18.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006780046387575567, "sensitivity": 0.5419885667435584 }, { "name": "model.layers.18.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.192631190060638e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006906039780005813, "sensitivity": 0.5287099810273603 }, { "name": "model.layers.18.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 4.257918590155896e-06, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.351557668589521e-06, "sensitivity": 2.1001130731669697 }, { "name": "model.layers.18.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.562369208040764e-07, "sensitivity": 10.0 }, { "name": "model.layers.18.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.763187128744903e-06, "sensitivity": 2.1043345314663116 }, { "name": "model.layers.18.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 2.7376900106901303e-05, "sensitivity": 1.748111329280677 }, { "name": "model.layers.18.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00018819123215507716, "sensitivity": 0.939685310589093 }, { "name": "model.layers.18.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.4522366655000951e-05, "sensitivity": 1.4164708630351979 }, { "name": "model.layers.18.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 6.193553417688236e-05, "sensitivity": 0.8128216660411776 }, { "name": "model.layers.18.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00026967673329636455, "sensitivity": 0.8376330955839231 }, { "name": "model.layers.19.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.876152863493189e-05, "sensitivity": 0.9368657139138483 }, { "name": "model.layers.19.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.310688374673191e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006349773029796779, "sensitivity": 0.5270105783285124 }, { "name": "model.layers.19.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.259953806875274e-05, "sensitivity": 0.8309648218957209 }, { "name": "model.layers.19.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.041017167670361e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000707445084117353, "sensitivity": 0.5697585547036377 }, { "name": "model.layers.19.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1552239811862819e-05, "sensitivity": 1.9940469018311662 }, { "name": "model.layers.19.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.059434435381263e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007168753072619438, "sensitivity": 0.5855177099166555 }, { "name": "model.layers.19.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.877359944861382e-05, "sensitivity": 0.8317974205649971 }, { "name": "model.layers.19.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.268306833590032e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006605886737816036, "sensitivity": 0.5294591891768197 }, { "name": "model.layers.19.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.942988718743436e-05, "sensitivity": 0.7317001785306171 }, { "name": "model.layers.19.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.702496986894403e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006537871668115258, "sensitivity": 0.5614494155288321 }, { "name": "model.layers.19.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7493285567034036e-05, "sensitivity": 0.74912740993433 }, { "name": "model.layers.19.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.849329222153756e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006556273438036442, "sensitivity": 0.5169610193034113 }, { "name": "model.layers.19.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.11172872595489e-05, "sensitivity": 1.0240929741990898 }, { "name": "model.layers.19.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.864110559945402e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007101434166543186, "sensitivity": 0.5668135204597028 }, { "name": "model.layers.19.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0779192962218076e-05, "sensitivity": 1.3815098479254246 }, { "name": "model.layers.19.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.660407052549999e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000644977088086307, "sensitivity": 0.5246232033408615 }, { "name": "model.layers.19.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.016890984028578e-05, "sensitivity": 0.8749706893868465 }, { "name": "model.layers.19.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.213451469084248e-06, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006543492199853063, "sensitivity": 0.5464301223789266 }, { "name": "model.layers.19.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1416795132390689e-05, "sensitivity": 1.3399636240782893 }, { "name": "model.layers.19.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.445188430210692e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007023645448498428, "sensitivity": 0.5562947351959591 }, { "name": "model.layers.19.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.57997588859871e-05, "sensitivity": 0.7067773016060271 }, { "name": "model.layers.19.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.104636322059378e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007509188144467771, "sensitivity": 0.5439033586991099 }, { "name": "model.layers.19.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9385925851529464e-05, "sensitivity": 0.8603636076457223 }, { "name": "model.layers.19.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.483292054326739e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006425100727938116, "sensitivity": 0.5483396439029959 }, { "name": "model.layers.19.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.850428715348244e-05, "sensitivity": 0.917049505608442 }, { "name": "model.layers.19.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.43550196805154e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006576854502782226, "sensitivity": 0.5353209026079859 }, { "name": "model.layers.19.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9805977798532695e-05, "sensitivity": 0.7073645233342587 }, { "name": "model.layers.19.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.104859266997664e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006434014067053795, "sensitivity": 0.5136237217934313 }, { "name": "model.layers.19.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.790881550638005e-05, "sensitivity": 0.6746842164845195 }, { "name": "model.layers.19.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.669226190249901e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006430658977478743, "sensitivity": 0.5316611349241777 }, { "name": "model.layers.19.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1670016647258308e-05, "sensitivity": 1.4198787003951607 }, { "name": "model.layers.19.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.171982699423097e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9268564655212685e-05, "sensitivity": 1.1612546878941197 }, { "name": "model.layers.19.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.410056084860116e-05, "sensitivity": 1.1977430586384112 }, { "name": "model.layers.19.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.534887688758317e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.193156877998263e-05, "sensitivity": 0.6426313137038404 }, { "name": "model.layers.19.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0938560990325641e-05, "sensitivity": 1.5229179097209378 }, { "name": "model.layers.19.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.414420568034984e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006432022200897336, "sensitivity": 0.5540096741732735 }, { "name": "model.layers.19.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1358623851265293e-05, "sensitivity": 1.3514023818537826 }, { "name": "model.layers.19.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.265703061420936e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.020099681336433e-05, "sensitivity": 0.6881783824875676 }, { "name": "model.layers.19.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9370500821387395e-05, "sensitivity": 1.000517065076244 }, { "name": "model.layers.19.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.684481827003765e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7954057410825044e-05, "sensitivity": 0.7661674736962873 }, { "name": "model.layers.19.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.829852307215333e-05, "sensitivity": 0.7800568850120693 }, { "name": "model.layers.19.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.891523642276297e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006413793889805675, "sensitivity": 0.5273246737813941 }, { "name": "model.layers.19.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.03534748632228e-05, "sensitivity": 1.237982908836851 }, { "name": "model.layers.19.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.749897127316217e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006312556797638535, "sensitivity": 0.5214923819024371 }, { "name": "model.layers.19.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9394555137259886e-05, "sensitivity": 0.6022237444304146 }, { "name": "model.layers.19.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.282489491444721e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000661953235976398, "sensitivity": 0.5213066511546013 }, { "name": "model.layers.19.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0869973822264e-05, "sensitivity": 0.965217678933039 }, { "name": "model.layers.19.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.181866183396778e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.991503348923288e-05, "sensitivity": 0.7317969912218751 }, { "name": "model.layers.19.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0501854022732005e-05, "sensitivity": 0.6333966674190391 }, { "name": "model.layers.19.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.728493756076205e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006635775207541883, "sensitivity": 0.5422034039721404 }, { "name": "model.layers.19.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1186511073901784e-05, "sensitivity": 1.5852904173513238 }, { "name": "model.layers.19.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.229607490444323e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006725361454300582, "sensitivity": 0.5521411792781745 }, { "name": "model.layers.19.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0126621974632144e-05, "sensitivity": 0.7493393007724858 }, { "name": "model.layers.19.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.61504770960164e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006824489100836217, "sensitivity": 0.5163088920234953 }, { "name": "model.layers.19.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006555861327797174, "sensitivity": 0.5185057049699867 }, { "name": "model.layers.19.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.237295219259977e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006527978694066405, "sensitivity": 0.5649147913536021 }, { "name": "model.layers.19.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.648800187278539e-06, "sensitivity": 1.5248140186814423 }, { "name": "model.layers.19.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.416620751930168e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.0684320740401745e-05, "sensitivity": 1.1521271074738644 }, { "name": "model.layers.19.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.046374200086575e-05, "sensitivity": 1.2983556341420088 }, { "name": "model.layers.19.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.616221751050034e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006142151542007923, "sensitivity": 0.532298515853381 }, { "name": "model.layers.19.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1996706234640442e-05, "sensitivity": 1.409989136042963 }, { "name": "model.layers.19.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.979807949392125e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000729390827473253, "sensitivity": 0.5574213863237296 }, { "name": "model.layers.19.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7058838137891144e-05, "sensitivity": 1.0910861709878656 }, { "name": "model.layers.19.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.890665531500417e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006176017923280597, "sensitivity": 0.543391802687166 }, { "name": "model.layers.19.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.495629011420533e-05, "sensitivity": 0.9440054367767609 }, { "name": "model.layers.19.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.688152100447041e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006264374824240804, "sensitivity": 0.5060698892120897 }, { "name": "model.layers.19.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.08495574851986e-05, "sensitivity": 0.865017073203918 }, { "name": "model.layers.19.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.289267275860766e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9303354646544904e-05, "sensitivity": 0.61350072645335 }, { "name": "model.layers.19.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.007466436130926e-05, "sensitivity": 0.7315432443963399 }, { "name": "model.layers.19.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.146688290049497e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006752772023901343, "sensitivity": 0.5580532278967869 }, { "name": "model.layers.19.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.98758969217306e-06, "sensitivity": 1.7948311737252942 }, { "name": "model.layers.19.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.500371109221305e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.4121570428833365e-05, "sensitivity": 0.806940336370173 }, { "name": "model.layers.19.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.898196104681119e-05, "sensitivity": 1.0253559648879715 }, { "name": "model.layers.19.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.180082093327655e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006347540183924139, "sensitivity": 0.5678225359521688 }, { "name": "model.layers.19.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.86785827181302e-05, "sensitivity": 0.7884680195882199 }, { "name": "model.layers.19.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.320281494889059e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006497708964161575, "sensitivity": 0.5132727013943641 }, { "name": "model.layers.19.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0107657191110775e-05, "sensitivity": 0.9028489549481789 }, { "name": "model.layers.19.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.533018108711985e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006651212461292744, "sensitivity": 0.5272881597419466 }, { "name": "model.layers.19.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.000467692501843e-05, "sensitivity": 0.7962600343848137 }, { "name": "model.layers.19.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.978726562716474e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006556756561622024, "sensitivity": 0.528546177834924 }, { "name": "model.layers.19.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.531976396217942e-05, "sensitivity": 0.7945056822522613 }, { "name": "model.layers.19.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.429080142173916e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007344274781644344, "sensitivity": 0.5998834423806344 }, { "name": "model.layers.19.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0258127632550895e-05, "sensitivity": 1.0351481610543374 }, { "name": "model.layers.19.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.659463676645828e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0643091273959726e-05, "sensitivity": 0.6642043776674201 }, { "name": "model.layers.19.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.287489668466151e-05, "sensitivity": 0.7697996550016973 }, { "name": "model.layers.19.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.583856813653256e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007254955125972629, "sensitivity": 0.5336876911035394 }, { "name": "model.layers.19.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.844206942943856e-06, "sensitivity": 1.2026372358492396 }, { "name": "model.layers.19.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1747588359867223e-06, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 9.470925760979299e-06, "sensitivity": 1.2443409414190048 }, { "name": "model.layers.19.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0849811587831937e-05, "sensitivity": 1.372281356271063 }, { "name": "model.layers.19.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.605294965491339e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.829457950312644e-05, "sensitivity": 0.8463575006522699 }, { "name": "model.layers.19.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.615096208406612e-05, "sensitivity": 0.6683099975122065 }, { "name": "model.layers.19.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.04539615981048e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007404100033454597, "sensitivity": 0.5775761645867791 }, { "name": "model.layers.19.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9947829868178815e-05, "sensitivity": 0.833319800020328 }, { "name": "model.layers.19.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.96244443993055e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6680852139834315e-05, "sensitivity": 0.6161824330517606 }, { "name": "model.layers.19.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2359560059849173e-05, "sensitivity": 1.6926097357846164 }, { "name": "model.layers.19.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.683429430471733e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.319249223452061e-05, "sensitivity": 1.0520214437640174 }, { "name": "model.layers.19.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0833906344487332e-05, "sensitivity": 1.2135509357842302 }, { "name": "model.layers.19.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.809052249285742e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006605993257835507, "sensitivity": 0.5455926154489663 }, { "name": "model.layers.19.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.747075192630291e-05, "sensitivity": 0.7130982560577908 }, { "name": "model.layers.19.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.498507332253212e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000653569120913744, "sensitivity": 0.548043846657554 }, { "name": "model.layers.19.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6294411479029804e-05, "sensitivity": 0.9590650951367612 }, { "name": "model.layers.19.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.248493597624474e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.4627111239824444e-05, "sensitivity": 0.6513163519566365 }, { "name": "model.layers.19.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.134665944846347e-05, "sensitivity": 1.3315920161631412 }, { "name": "model.layers.19.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.053348796631326e-06, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007221802952699363, "sensitivity": 0.5895840052086339 }, { "name": "model.layers.19.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.741901622968726e-05, "sensitivity": 0.7645136066760989 }, { "name": "model.layers.19.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.351462383870967e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006328622112050653, "sensitivity": 0.5461907344128292 }, { "name": "model.layers.19.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.404653347795829e-05, "sensitivity": 1.179558587592771 }, { "name": "model.layers.19.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.664168831273855e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.427856740425341e-05, "sensitivity": 0.6141391982924809 }, { "name": "model.layers.19.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7651424867799506e-05, "sensitivity": 0.7277730013884077 }, { "name": "model.layers.19.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0248520538880257e-06, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006189779378473759, "sensitivity": 0.5697858442907295 }, { "name": "model.layers.19.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0931367796729319e-05, "sensitivity": 1.4032921112624044 }, { "name": "model.layers.19.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.094611535445438e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000666033651214093, "sensitivity": 0.5420334555032834 }, { "name": "model.layers.19.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.884556958335452e-05, "sensitivity": 1.0708581382907387 }, { "name": "model.layers.19.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.483180072791583e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006568226963281631, "sensitivity": 0.536442410387929 }, { "name": "model.layers.19.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.833373870700598e-05, "sensitivity": 1.015433603172787 }, { "name": "model.layers.19.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.138424737400783e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006581383058801293, "sensitivity": 0.5304815211887368 }, { "name": "model.layers.19.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0427773860283196e-05, "sensitivity": 0.9364708316005375 }, { "name": "model.layers.19.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.87486021888617e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006520829047076404, "sensitivity": 0.5654456146318855 }, { "name": "model.layers.19.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.1925652617937885e-06, "sensitivity": 2.0972786766816274 }, { "name": "model.layers.19.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.89389355052117e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.375222099246457e-05, "sensitivity": 0.6475168023822913 }, { "name": "model.layers.19.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8241388614987954e-05, "sensitivity": 1.0682038408475387 }, { "name": "model.layers.19.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.678812158294022e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006347006419673562, "sensitivity": 0.5723633529378053 }, { "name": "model.layers.19.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.98369151703082e-05, "sensitivity": 0.6645464671032554 }, { "name": "model.layers.19.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.031452125578653e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006706027197651565, "sensitivity": 0.5517007175599339 }, { "name": "model.layers.19.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006556607550010085, "sensitivity": 0.5512331352882991 }, { "name": "model.layers.19.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.89728870181716e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006292978650890291, "sensitivity": 0.525099748941682 }, { "name": "model.layers.19.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.029702126397751e-05, "sensitivity": 0.9656435215990208 }, { "name": "model.layers.19.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.664469651695981e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006722956895828247, "sensitivity": 0.557957691165478 }, { "name": "model.layers.19.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 4.0031973185250536e-06, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3383036023005843e-06, "sensitivity": 2.099834170023734 }, { "name": "model.layers.19.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.417579925255268e-07, "sensitivity": 10.0 }, { "name": "model.layers.19.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 7.790118615957908e-06, "sensitivity": 1.386085282875864 }, { "name": "model.layers.19.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 3.192814256181009e-05, "sensitivity": 1.9421012090134682 }, { "name": "model.layers.19.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00018077378626912832, "sensitivity": 1.0690458319870662 }, { "name": "model.layers.19.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.643800896999892e-05, "sensitivity": 1.258131320190985 }, { "name": "model.layers.19.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0006832742947153747, "sensitivity": 0.5504496310558208 }, { "name": "model.layers.19.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002673773851711303, "sensitivity": 0.7335318994903526 }, { "name": "model.layers.20.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.961624265182763e-05, "sensitivity": 1.1916419808917444 }, { "name": "model.layers.20.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.023475288609916e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000653678725939244, "sensitivity": 0.5454899039390482 }, { "name": "model.layers.20.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007260659476742148, "sensitivity": 0.558578567938649 }, { "name": "model.layers.20.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.65069535443763e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006928014336153865, "sensitivity": 0.5619652476146978 }, { "name": "model.layers.20.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.731965939048678e-05, "sensitivity": 0.8083513440873115 }, { "name": "model.layers.20.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.098125027165224e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006385261658579111, "sensitivity": 0.5155225274504436 }, { "name": "model.layers.20.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.111292168498039e-05, "sensitivity": 0.7800007594133374 }, { "name": "model.layers.20.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0853761978069087e-06, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006966580986045301, "sensitivity": 0.5938431191585292 }, { "name": "model.layers.20.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.28968991804868e-05, "sensitivity": 1.094395647017167 }, { "name": "model.layers.20.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.894449254308711e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006917395512573421, "sensitivity": 0.5802581662989211 }, { "name": "model.layers.20.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.997137850499712e-05, "sensitivity": 0.8147287335770342 }, { "name": "model.layers.20.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.072899623177364e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006632154108956456, "sensitivity": 0.5266012694026626 }, { "name": "model.layers.20.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.024046888342127e-05, "sensitivity": 0.621071143835717 }, { "name": "model.layers.20.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.984358833506121e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006495471461676061, "sensitivity": 0.5454412458445417 }, { "name": "model.layers.20.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1901624020538293e-05, "sensitivity": 1.2660654527481943 }, { "name": "model.layers.20.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.73505405504693e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007166418945416808, "sensitivity": 0.5473248265596455 }, { "name": "model.layers.20.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.896115180803463e-05, "sensitivity": 0.9732723633923882 }, { "name": "model.layers.20.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.084046723728534e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006447415798902512, "sensitivity": 0.5699147117777952 }, { "name": "model.layers.20.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.380700506269932e-05, "sensitivity": 0.7754000973915249 }, { "name": "model.layers.20.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.505779310828075e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007014956208877265, "sensitivity": 0.5447520914846815 }, { "name": "model.layers.20.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1279113095952198e-05, "sensitivity": 1.3353169363381971 }, { "name": "model.layers.20.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.66623247222742e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00068761280272156, "sensitivity": 0.5587166741328682 }, { "name": "model.layers.20.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1129122867714614e-05, "sensitivity": 1.362740400456367 }, { "name": "model.layers.20.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.079289960325696e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006673883181065321, "sensitivity": 0.5735166742662103 }, { "name": "model.layers.20.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0410891263745725e-05, "sensitivity": 1.572998315131814 }, { "name": "model.layers.20.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.779949105999549e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006365698645822704, "sensitivity": 0.5785869438462765 }, { "name": "model.layers.20.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.821452214149758e-05, "sensitivity": 0.7819496616151946 }, { "name": "model.layers.20.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.246266816058778e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.634051558445208e-05, "sensitivity": 0.6834350239893332 }, { "name": "model.layers.20.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.642544056172483e-05, "sensitivity": 1.1578293132151791 }, { "name": "model.layers.20.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.620047431875719e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.466632865136489e-05, "sensitivity": 0.9142775563345338 }, { "name": "model.layers.20.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.207567639648914e-05, "sensitivity": 1.0139544612624622 }, { "name": "model.layers.20.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.489703991974238e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007027639076113701, "sensitivity": 0.5763819346659312 }, { "name": "model.layers.20.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.33366871625185e-05, "sensitivity": 0.7636777835754364 }, { "name": "model.layers.20.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.137062081914337e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007067638216540217, "sensitivity": 0.560823282249965 }, { "name": "model.layers.20.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.233137537492439e-05, "sensitivity": 1.127482327769577 }, { "name": "model.layers.20.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.131464260761277e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000672479160130024, "sensitivity": 0.563138616987967 }, { "name": "model.layers.20.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.2768135750084184e-06, "sensitivity": 2.0112249942968745 }, { "name": "model.layers.20.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.651580406469293e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.230555689195171e-05, "sensitivity": 0.9631153478214038 }, { "name": "model.layers.20.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0674742043192964e-05, "sensitivity": 1.2206043971814293 }, { "name": "model.layers.20.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.995870537844894e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006441769655793905, "sensitivity": 0.5460091414469681 }, { "name": "model.layers.20.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.538719753734767e-05, "sensitivity": 1.053729067020045 }, { "name": "model.layers.20.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.265975341397279e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.419725104933605e-05, "sensitivity": 0.614372991475755 }, { "name": "model.layers.20.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.959677218925208e-05, "sensitivity": 1.027089020236314 }, { "name": "model.layers.20.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.246784884453518e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006592316785827279, "sensitivity": 0.5521797051275956 }, { "name": "model.layers.20.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.308910087682307e-05, "sensitivity": 0.9248132098272854 }, { "name": "model.layers.20.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.302560334210284e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.142591882962734e-05, "sensitivity": 0.637414335902284 }, { "name": "model.layers.20.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1367227671144065e-05, "sensitivity": 1.8346651201542072 }, { "name": "model.layers.20.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.400272122344177e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.208679405972362e-05, "sensitivity": 0.6651005247440128 }, { "name": "model.layers.20.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.102721034840215e-05, "sensitivity": 1.5244497404667137 }, { "name": "model.layers.20.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.961745384614915e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9643934946507215e-05, "sensitivity": 0.695110920857563 }, { "name": "model.layers.20.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1616614756349009e-05, "sensitivity": 1.390316483217166 }, { "name": "model.layers.20.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.207851240309537e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006977186421863735, "sensitivity": 0.5334477169753207 }, { "name": "model.layers.20.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.207222759258002e-05, "sensitivity": 0.8834528181524062 }, { "name": "model.layers.20.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.692844974371837e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006551377009600401, "sensitivity": 0.5788208403768159 }, { "name": "model.layers.20.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1329204426147044e-05, "sensitivity": 1.2888320183054887 }, { "name": "model.layers.20.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.889672583085485e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.1504132999107242e-05, "sensitivity": 1.5431553725436902 }, { "name": "model.layers.20.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.740686901845038e-05, "sensitivity": 1.1837355224122694 }, { "name": "model.layers.20.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.184998824210197e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6090513680828735e-05, "sensitivity": 0.6873437541620037 }, { "name": "model.layers.20.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.046454235620331e-05, "sensitivity": 1.6128239070207657 }, { "name": "model.layers.20.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.744840336774359e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5701144447084516e-05, "sensitivity": 0.6123968877190555 }, { "name": "model.layers.20.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0920501154032536e-05, "sensitivity": 1.620761244475798 }, { "name": "model.layers.20.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.075031251384644e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006550023099407554, "sensitivity": 0.5649350499684704 }, { "name": "model.layers.20.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.172854773467407e-05, "sensitivity": 1.1586999967765297 }, { "name": "model.layers.20.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.649045983271208e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006698516081087291, "sensitivity": 0.5922356645552063 }, { "name": "model.layers.20.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.19320198893547e-05, "sensitivity": 0.8493296410244968 }, { "name": "model.layers.20.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.401502901098866e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006774346111342311, "sensitivity": 0.5717505990487768 }, { "name": "model.layers.20.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.588730320800096e-05, "sensitivity": 1.1546306379737472 }, { "name": "model.layers.20.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.814826060188352e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.806179590057582e-05, "sensitivity": 0.9701636485703039 }, { "name": "model.layers.20.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0848245437955484e-05, "sensitivity": 1.819937022744789 }, { "name": "model.layers.20.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.056972097212565e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.738443724112585e-05, "sensitivity": 0.6192220301851763 }, { "name": "model.layers.20.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.027605559211224e-05, "sensitivity": 0.9054179887435536 }, { "name": "model.layers.20.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.192144835244108e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006684227264486253, "sensitivity": 0.5382310001134892 }, { "name": "model.layers.20.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1007088687620126e-05, "sensitivity": 1.7554986195726427 }, { "name": "model.layers.20.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.19981392446789e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006586122326552868, "sensitivity": 0.5944542380048052 }, { "name": "model.layers.20.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0377259968663566e-05, "sensitivity": 1.2745752563793746 }, { "name": "model.layers.20.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.380104196068714e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006331743206828833, "sensitivity": 0.5394281888333716 }, { "name": "model.layers.20.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.683744140900671e-05, "sensitivity": 0.9976576812085537 }, { "name": "model.layers.20.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.427003652082931e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007456554449163377, "sensitivity": 0.5582909850495396 }, { "name": "model.layers.20.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0279762136633508e-05, "sensitivity": 1.477514274928815 }, { "name": "model.layers.20.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.367549864691682e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5681255616946146e-05, "sensitivity": 0.7416347049486325 }, { "name": "model.layers.20.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.66761989123188e-05, "sensitivity": 0.9848148761165249 }, { "name": "model.layers.20.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.466067017958267e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007716318359598517, "sensitivity": 0.558240680385377 }, { "name": "model.layers.20.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.949829937890172e-05, "sensitivity": 0.905795314002399 }, { "name": "model.layers.20.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.631507514815894e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000659218174405396, "sensitivity": 0.5306706047995501 }, { "name": "model.layers.20.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.127789674792439e-05, "sensitivity": 1.0301379235554617 }, { "name": "model.layers.20.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.736122592585161e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006708709406666458, "sensitivity": 0.5484715766211175 }, { "name": "model.layers.20.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.70923909638077e-05, "sensitivity": 0.9241821580671827 }, { "name": "model.layers.20.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.978014420790714e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.763505371054634e-05, "sensitivity": 0.8807684402131044 }, { "name": "model.layers.20.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.050448791938834e-05, "sensitivity": 0.8679977555904304 }, { "name": "model.layers.20.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.544666462104942e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006482892786152661, "sensitivity": 0.570132743848603 }, { "name": "model.layers.20.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.381754064932466e-05, "sensitivity": 0.9543989653470197 }, { "name": "model.layers.20.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.033422318476369e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006927655776962638, "sensitivity": 0.5465341664004278 }, { "name": "model.layers.20.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0581162314338144e-05, "sensitivity": 1.712146219629282 }, { "name": "model.layers.20.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.420850801689085e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.0253881555399857e-05, "sensitivity": 1.550776928042143 }, { "name": "model.layers.20.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.031189695931971e-05, "sensitivity": 0.9216292772220124 }, { "name": "model.layers.20.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.000300570325635e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006763345445506275, "sensitivity": 0.5475465354076753 }, { "name": "model.layers.20.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.472907261922956e-05, "sensitivity": 0.8547923224195489 }, { "name": "model.layers.20.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.879174065943516e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006940357270650566, "sensitivity": 0.5636609558215082 }, { "name": "model.layers.20.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1034686394850723e-05, "sensitivity": 1.3709432762271838 }, { "name": "model.layers.20.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.199471727086348e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006840967107564211, "sensitivity": 0.5928577602703559 }, { "name": "model.layers.20.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0009224398527294e-05, "sensitivity": 0.9343061735791691 }, { "name": "model.layers.20.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.999666197771148e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006848049233667552, "sensitivity": 0.5339999918743596 }, { "name": "model.layers.20.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0380710591562092e-05, "sensitivity": 1.3355791098210417 }, { "name": "model.layers.20.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.913892096032214e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.687677185051143e-05, "sensitivity": 0.8344424737458406 }, { "name": "model.layers.20.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2030905054416507e-05, "sensitivity": 1.372299701064696 }, { "name": "model.layers.20.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.529755521318293e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007453722646459937, "sensitivity": 0.542862276386131 }, { "name": "model.layers.20.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.866892752237618e-05, "sensitivity": 0.7536253260902532 }, { "name": "model.layers.20.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.079810870891379e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006729393498972058, "sensitivity": 0.5919462851701527 }, { "name": "model.layers.20.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.586630479432642e-05, "sensitivity": 1.1753121405955858 }, { "name": "model.layers.20.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1028976132365642e-06, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.735823990311474e-05, "sensitivity": 0.6074948195154166 }, { "name": "model.layers.20.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0839878086699173e-05, "sensitivity": 1.276936828094001 }, { "name": "model.layers.20.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.775577847089153e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006449393695220351, "sensitivity": 0.5160687124382078 }, { "name": "model.layers.20.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0283423762302846e-05, "sensitivity": 1.3334902539381457 }, { "name": "model.layers.20.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.314206863564323e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006283309776335955, "sensitivity": 0.5997061915728015 }, { "name": "model.layers.20.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.033540557837114e-05, "sensitivity": 0.7628965819978677 }, { "name": "model.layers.20.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.498334528259875e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006860859575681388, "sensitivity": 0.5043214022280578 }, { "name": "model.layers.20.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0406653018435463e-05, "sensitivity": 1.9796778402191213 }, { "name": "model.layers.20.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.502517291868571e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.616348789772019e-05, "sensitivity": 1.1078518719400512 }, { "name": "model.layers.20.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.542096449877135e-06, "sensitivity": 1.7564646766345273 }, { "name": "model.layers.20.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.519221986105549e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.0778500735759735e-05, "sensitivity": 0.9458449278470007 }, { "name": "model.layers.20.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.372154166456312e-05, "sensitivity": 0.990856333627188 }, { "name": "model.layers.20.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.570590921408439e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.435949762817472e-05, "sensitivity": 0.734999072091588 }, { "name": "model.layers.20.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.672129918821156e-05, "sensitivity": 0.9204653334196655 }, { "name": "model.layers.20.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0373216809966834e-06, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006376021774485707, "sensitivity": 0.5604044189238739 }, { "name": "model.layers.20.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1420552255003713e-05, "sensitivity": 1.4456218373715932 }, { "name": "model.layers.20.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.444972993653209e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006774680223315954, "sensitivity": 0.5310657656391488 }, { "name": "model.layers.20.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0526945162564516e-05, "sensitivity": 1.0166908052597403 }, { "name": "model.layers.20.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.331118692694872e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006412116345018148, "sensitivity": 0.5425306412546711 }, { "name": "model.layers.20.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 4.22104176323046e-06, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4972766823339043e-06, "sensitivity": 2.101144466001612 }, { "name": "model.layers.20.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.738845286236028e-07, "sensitivity": 10.0 }, { "name": "model.layers.20.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 8.260114555014297e-06, "sensitivity": 1.7497824349980893 }, { "name": "model.layers.20.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 6.9907564466120675e-06, "sensitivity": 2.0597086861660436 }, { "name": "model.layers.20.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00020233738177921623, "sensitivity": 1.0101991886306045 }, { "name": "model.layers.20.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.454328048566822e-05, "sensitivity": 1.4035260193678885 }, { "name": "model.layers.20.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.8794459619093686e-05, "sensitivity": 0.6302626247618112 }, { "name": "model.layers.20.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003008406492881477, "sensitivity": 0.825203343686161 }, { "name": "model.layers.21.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.470707012340426e-05, "sensitivity": 1.1405754990494357 }, { "name": "model.layers.21.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.869817070764839e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00071334297535941, "sensitivity": 0.5277189655509682 }, { "name": "model.layers.21.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.145892984932289e-05, "sensitivity": 0.8981685082232558 }, { "name": "model.layers.21.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.423890338031924e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006810436025261879, "sensitivity": 0.5441798069500908 }, { "name": "model.layers.21.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9178313676966354e-05, "sensitivity": 0.6322503508803525 }, { "name": "model.layers.21.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.45981276142993e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006666152039542794, "sensitivity": 0.49616880216085524 }, { "name": "model.layers.21.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4089061450213194e-05, "sensitivity": 0.9503398868682165 }, { "name": "model.layers.21.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.417047870854731e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005756285972893238, "sensitivity": 0.5662198854708143 }, { "name": "model.layers.21.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9239595429971814e-05, "sensitivity": 1.181638438713063 }, { "name": "model.layers.21.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.037862701508857e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006333107594400644, "sensitivity": 0.5527928063399578 }, { "name": "model.layers.21.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.065780088538304e-05, "sensitivity": 1.5724684563124416 }, { "name": "model.layers.21.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.729625164960453e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006192586151883006, "sensitivity": 0.5613491564568702 }, { "name": "model.layers.21.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.557505210163072e-05, "sensitivity": 0.8746739087617841 }, { "name": "model.layers.21.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.352805593858648e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005968051846139133, "sensitivity": 0.5469736692587901 }, { "name": "model.layers.21.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.704361294396222e-05, "sensitivity": 1.0234870286173972 }, { "name": "model.layers.21.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.47854187466146e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.475860573118553e-05, "sensitivity": 1.0945644950246605 }, { "name": "model.layers.21.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8123514463659376e-05, "sensitivity": 0.8187532116792057 }, { "name": "model.layers.21.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.156410219977261e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006469328654929996, "sensitivity": 0.5270182753440417 }, { "name": "model.layers.21.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0189176464336924e-05, "sensitivity": 1.2672851248044037 }, { "name": "model.layers.21.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.372174539137632e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006151500856503844, "sensitivity": 0.5363336815226907 }, { "name": "model.layers.21.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.137401214800775e-05, "sensitivity": 0.9766061153983782 }, { "name": "model.layers.21.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.607788686276763e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000670911162160337, "sensitivity": 0.5338839562401135 }, { "name": "model.layers.21.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.860920646227896e-05, "sensitivity": 0.9593149572590405 }, { "name": "model.layers.21.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.483195420514676e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006587253883481026, "sensitivity": 0.5734096887531699 }, { "name": "model.layers.21.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.882800542167388e-05, "sensitivity": 0.6482169617977906 }, { "name": "model.layers.21.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.061071750693372e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000619435915723443, "sensitivity": 0.5225868773872941 }, { "name": "model.layers.21.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.589374268311076e-05, "sensitivity": 1.131786674100676 }, { "name": "model.layers.21.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.98837697604904e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.0364199624746107e-05, "sensitivity": 1.2095712247361128 }, { "name": "model.layers.21.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.336133810691535e-05, "sensitivity": 0.6485839395462321 }, { "name": "model.layers.21.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.850230758776888e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006753271445631981, "sensitivity": 0.5265299552694438 }, { "name": "model.layers.21.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.934457294642925e-05, "sensitivity": 0.8426853116919891 }, { "name": "model.layers.21.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.76200386351411e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006494239205494523, "sensitivity": 0.5330858177802806 }, { "name": "model.layers.21.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0701416613301262e-05, "sensitivity": 1.2495467924527464 }, { "name": "model.layers.21.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.606962182966527e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006318545201793313, "sensitivity": 0.5876133186381026 }, { "name": "model.layers.21.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.879285163246095e-05, "sensitivity": 0.8070965065733529 }, { "name": "model.layers.21.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.428587878166582e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006257513887248933, "sensitivity": 0.5357910339842388 }, { "name": "model.layers.21.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0835396096808836e-05, "sensitivity": 1.3922430188789718 }, { "name": "model.layers.21.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.326366701614461e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000656719203107059, "sensitivity": 0.5182769977667021 }, { "name": "model.layers.21.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0884653066750616e-05, "sensitivity": 0.8130134376217784 }, { "name": "model.layers.21.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.99333554621262e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006487469072453678, "sensitivity": 0.5774438552440821 }, { "name": "model.layers.21.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.793773743789643e-05, "sensitivity": 0.8275856461126941 }, { "name": "model.layers.21.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.71174370584049e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000605597160756588, "sensitivity": 0.5187332723226392 }, { "name": "model.layers.21.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.370445771608502e-05, "sensitivity": 0.6237224031778393 }, { "name": "model.layers.21.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.00828126759734e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006917849532328546, "sensitivity": 0.5523803057096908 }, { "name": "model.layers.21.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0309324352419935e-05, "sensitivity": 1.4048941215489588 }, { "name": "model.layers.21.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.575747650254925e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006085638306103647, "sensitivity": 0.5159564884975094 }, { "name": "model.layers.21.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6270808272529393e-05, "sensitivity": 0.8629456893193356 }, { "name": "model.layers.21.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.869498747619218e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006053994875401258, "sensitivity": 0.5243826231545688 }, { "name": "model.layers.21.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7954381190938875e-05, "sensitivity": 1.1802838393255397 }, { "name": "model.layers.21.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.645947792094375e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006071124807931483, "sensitivity": 0.4954425177365363 }, { "name": "model.layers.21.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.430847871437436e-06, "sensitivity": 2.0968226202249425 }, { "name": "model.layers.21.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.344195639940153e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000664765015244484, "sensitivity": 0.5337841621169286 }, { "name": "model.layers.21.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1897648619196843e-05, "sensitivity": 1.301363233344454 }, { "name": "model.layers.21.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.632056847091008e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.358055543387309e-05, "sensitivity": 0.8693081580805506 }, { "name": "model.layers.21.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.635792669840157e-05, "sensitivity": 0.6569584651703313 }, { "name": "model.layers.21.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.294833039850346e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007257845136336982, "sensitivity": 0.5357987850484229 }, { "name": "model.layers.21.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.584775863098912e-05, "sensitivity": 0.6107468723755627 }, { "name": "model.layers.21.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.127850156190107e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006040145526640117, "sensitivity": 0.5161898611115291 }, { "name": "model.layers.21.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.553993443958461e-05, "sensitivity": 0.6397581027143381 }, { "name": "model.layers.21.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.74033389663964e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007216609083116055, "sensitivity": 0.5211462688160122 }, { "name": "model.layers.21.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.358297832775861e-05, "sensitivity": 0.8215587668279092 }, { "name": "model.layers.21.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.375008752002032e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.261604721657932e-05, "sensitivity": 0.7148120926793915 }, { "name": "model.layers.21.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.95935741532594e-05, "sensitivity": 1.1524595037576861 }, { "name": "model.layers.21.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.17182274456718e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007819534512236714, "sensitivity": 0.5423164583934699 }, { "name": "model.layers.21.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.883823541807942e-05, "sensitivity": 0.6803150515668173 }, { "name": "model.layers.21.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.72085582462023e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00063799147028476, "sensitivity": 0.551994440533667 }, { "name": "model.layers.21.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.195553634010139e-06, "sensitivity": 2.0970824769479073 }, { "name": "model.layers.21.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.672940233125701e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000590536103118211, "sensitivity": 0.5198198146986255 }, { "name": "model.layers.21.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.757307371823117e-05, "sensitivity": 0.6360062981662613 }, { "name": "model.layers.21.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1571207778615644e-06, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006157857715152204, "sensitivity": 0.5643761312959038 }, { "name": "model.layers.21.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1914049537153915e-05, "sensitivity": 1.6130534958913352 }, { "name": "model.layers.21.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.289471568583394e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007349028019234538, "sensitivity": 0.5355710078574176 }, { "name": "model.layers.21.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.183538062032312e-05, "sensitivity": 0.9234467734891907 }, { "name": "model.layers.21.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.584716286146431e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006960986065678298, "sensitivity": 0.5607702890469304 }, { "name": "model.layers.21.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.890133616048843e-05, "sensitivity": 0.8866689404702304 }, { "name": "model.layers.21.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.730891411483753e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.465430149342865e-05, "sensitivity": 0.6053900239414027 }, { "name": "model.layers.21.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.849348963238299e-05, "sensitivity": 0.6857072491240499 }, { "name": "model.layers.21.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.906662181587308e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006367613095790148, "sensitivity": 0.5140802155664165 }, { "name": "model.layers.21.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.599655898753554e-05, "sensitivity": 1.0034940597911512 }, { "name": "model.layers.21.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.146254918348859e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.420408317353576e-05, "sensitivity": 0.6600740954700368 }, { "name": "model.layers.21.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6511118600610644e-05, "sensitivity": 0.7222658021020516 }, { "name": "model.layers.21.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.970707767730346e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5994569265749305e-05, "sensitivity": 0.63260745308644 }, { "name": "model.layers.21.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.826041888212785e-05, "sensitivity": 0.9672263150114004 }, { "name": "model.layers.21.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.385035243918537e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5761804105713964e-05, "sensitivity": 0.6158916572846231 }, { "name": "model.layers.21.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.10812712693587e-05, "sensitivity": 1.0026139040159063 }, { "name": "model.layers.21.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.617235612793593e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006627800757996738, "sensitivity": 0.5406390792211939 }, { "name": "model.layers.21.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000641274731606245, "sensitivity": 0.5634387430241662 }, { "name": "model.layers.21.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.933584586477082e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006220659706741571, "sensitivity": 0.5250074927021652 }, { "name": "model.layers.21.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6636483350303024e-05, "sensitivity": 1.1109737555801247 }, { "name": "model.layers.21.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.678537036146736e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006289500743150711, "sensitivity": 0.531988322664145 }, { "name": "model.layers.21.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9459525800775737e-05, "sensitivity": 0.9117354680240873 }, { "name": "model.layers.21.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.135742521313659e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006434587412513793, "sensitivity": 0.549942426721354 }, { "name": "model.layers.21.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8652683947002515e-05, "sensitivity": 0.7680744627554967 }, { "name": "model.layers.21.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.538255886174738e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.565858737099916e-05, "sensitivity": 0.6276297241848575 }, { "name": "model.layers.21.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9434572904137895e-05, "sensitivity": 0.9284828392958464 }, { "name": "model.layers.21.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.5544147648543e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006237897323444486, "sensitivity": 0.5534648183721057 }, { "name": "model.layers.21.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.54807809041813e-05, "sensitivity": 0.8250748164600921 }, { "name": "model.layers.21.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.711947773714201e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000730929896235466, "sensitivity": 0.5464915360339504 }, { "name": "model.layers.21.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0739082426880486e-05, "sensitivity": 1.3276580275218854 }, { "name": "model.layers.21.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.444740385333716e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.736047387472354e-05, "sensitivity": 0.685787969705762 }, { "name": "model.layers.21.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.489269096869975e-05, "sensitivity": 0.6931987539767394 }, { "name": "model.layers.21.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.986200903862482e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006049717194400728, "sensitivity": 0.5132135174887917 }, { "name": "model.layers.21.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.159242184367031e-05, "sensitivity": 0.6712487122626843 }, { "name": "model.layers.21.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.734593054919969e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9704754676204175e-05, "sensitivity": 0.623061109610997 }, { "name": "model.layers.21.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9615791542455554e-05, "sensitivity": 0.7275653637179735 }, { "name": "model.layers.21.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.111860895747668e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006256886990740895, "sensitivity": 0.5256866760678321 }, { "name": "model.layers.21.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.596443224931136e-05, "sensitivity": 1.0126009794573219 }, { "name": "model.layers.21.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.282928891072515e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006127101369202137, "sensitivity": 0.5982327648013748 }, { "name": "model.layers.21.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.682985364634078e-06, "sensitivity": 1.2538070564459824 }, { "name": "model.layers.21.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0650073818396777e-06, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.24188217241317e-05, "sensitivity": 0.6272980026541357 }, { "name": "model.layers.21.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.700580368284136e-05, "sensitivity": 0.8955829602496694 }, { "name": "model.layers.21.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.966756700421683e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006296024657785892, "sensitivity": 0.5352157491990078 }, { "name": "model.layers.21.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.539047727623256e-06, "sensitivity": 2.097609276374532 }, { "name": "model.layers.21.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3108351595292334e-06, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.636913556372747e-05, "sensitivity": 0.9781671104935199 }, { "name": "model.layers.21.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.356221274472773e-05, "sensitivity": 0.8491077840274295 }, { "name": "model.layers.21.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.405703286167409e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006949134403839707, "sensitivity": 0.52600187844559 }, { "name": "model.layers.21.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.846908243256621e-05, "sensitivity": 1.1402759260158555 }, { "name": "model.layers.21.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.328581202476926e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.680865069734864e-05, "sensitivity": 0.6586736467989712 }, { "name": "model.layers.21.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.472470002132468e-05, "sensitivity": 0.8804270933809185 }, { "name": "model.layers.21.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.694417038488609e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005938475951552391, "sensitivity": 0.5416502566170365 }, { "name": "model.layers.21.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.998781933973078e-06, "sensitivity": 1.3403120055299953 }, { "name": "model.layers.21.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.916719712535269e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 9.702158422442153e-06, "sensitivity": 1.3978888198182515 }, { "name": "model.layers.21.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1622492820606567e-05, "sensitivity": 1.2578874620116256 }, { "name": "model.layers.21.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.004314733829233e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007119872607290745, "sensitivity": 0.5313371725952815 }, { "name": "model.layers.21.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.0241859601810575e-06, "sensitivity": 2.0972836723120185 }, { "name": "model.layers.21.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.896821224065206e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 4.7952751629054546e-05, "sensitivity": 0.8504883641154154 }, { "name": "model.layers.21.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.582808418897912e-05, "sensitivity": 0.8569958708927742 }, { "name": "model.layers.21.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.205947210626618e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007280017016455531, "sensitivity": 0.5364832208362303 }, { "name": "model.layers.21.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 3.782971816690406e-06, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4380983631999698e-06, "sensitivity": 2.1007758199750826 }, { "name": "model.layers.21.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.585783237118449e-07, "sensitivity": 10.0 }, { "name": "model.layers.21.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.964564489753684e-06, "sensitivity": 2.1039044575160832 }, { "name": "model.layers.21.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 8.39658150653122e-06, "sensitivity": 2.11276756029186 }, { "name": "model.layers.21.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00019187886209692806, "sensitivity": 0.8865392553408962 }, { "name": "model.layers.21.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.7045678760041483e-05, "sensitivity": 1.3427902773651461 }, { "name": "model.layers.21.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 5, "mse": 3.0231710752559593e-06, "sensitivity": 2.0203870733171136 }, { "name": "model.layers.21.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002694542345125228, "sensitivity": 0.6575331437532186 }, { "name": "model.layers.22.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.56667907605879e-05, "sensitivity": 0.8483390800657236 }, { "name": "model.layers.22.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0087665032187942e-06, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007416922599077225, "sensitivity": 0.5616760605953999 }, { "name": "model.layers.22.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.572026904905215e-05, "sensitivity": 1.0888276061983084 }, { "name": "model.layers.22.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.836781262289151e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.316692451946437e-05, "sensitivity": 0.665804004245721 }, { "name": "model.layers.22.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.71158598177135e-05, "sensitivity": 1.113347077749221 }, { "name": "model.layers.22.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.745454245698056e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006312463083304465, "sensitivity": 0.5453714096967 }, { "name": "model.layers.22.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0667284186638426e-05, "sensitivity": 1.5706242917853293 }, { "name": "model.layers.22.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.555057320336346e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006635886966250837, "sensitivity": 0.5468768801696748 }, { "name": "model.layers.22.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7087581808445975e-05, "sensitivity": 1.1282998578813328 }, { "name": "model.layers.22.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.536180651688483e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.482445703819394e-05, "sensitivity": 0.6866101348857243 }, { "name": "model.layers.22.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.6337900180806173e-06, "sensitivity": 2.0973933110073917 }, { "name": "model.layers.22.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.964116548464517e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007536776829510927, "sensitivity": 0.550156683104402 }, { "name": "model.layers.22.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.105373667087406e-05, "sensitivity": 1.5163363240948067 }, { "name": "model.layers.22.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.457571769009519e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006607574177905917, "sensitivity": 0.5957658441687577 }, { "name": "model.layers.22.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.241083610802889e-05, "sensitivity": 0.9678169495017461 }, { "name": "model.layers.22.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.626940146110428e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.452956586144865e-05, "sensitivity": 0.609754298182538 }, { "name": "model.layers.22.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.711079575121403e-05, "sensitivity": 0.9335853188160506 }, { "name": "model.layers.22.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.272758241721021e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006226321565918624, "sensitivity": 0.55496667450775 }, { "name": "model.layers.22.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.71858327020891e-05, "sensitivity": 0.6584179212456969 }, { "name": "model.layers.22.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.20395894657122e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006378985708579421, "sensitivity": 0.5036602016905956 }, { "name": "model.layers.22.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0642343113431707e-05, "sensitivity": 1.3255387571925519 }, { "name": "model.layers.22.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.008833217194478e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006411510985344648, "sensitivity": 0.554858466198227 }, { "name": "model.layers.22.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.154163565952331e-05, "sensitivity": 1.0489646133021868 }, { "name": "model.layers.22.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.735507321944169e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000679934280924499, "sensitivity": 0.5476577570906018 }, { "name": "model.layers.22.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6347060308326036e-05, "sensitivity": 0.9368099713264783 }, { "name": "model.layers.22.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.808370577957248e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.551743015530519e-05, "sensitivity": 0.6783149444246934 }, { "name": "model.layers.22.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.870162203791551e-05, "sensitivity": 1.1278496277974495 }, { "name": "model.layers.22.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.443484489362163e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7908411690732464e-05, "sensitivity": 0.7506539027482667 }, { "name": "model.layers.22.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.07698893873021e-05, "sensitivity": 0.8698657314504603 }, { "name": "model.layers.22.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.645922780990077e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006563437054865062, "sensitivity": 0.509784640877408 }, { "name": "model.layers.22.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.620387310045771e-05, "sensitivity": 0.9380033253939282 }, { "name": "model.layers.22.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1663373697956558e-06, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006272218888625503, "sensitivity": 0.5863626444774883 }, { "name": "model.layers.22.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0950212526950054e-05, "sensitivity": 1.458229272982133 }, { "name": "model.layers.22.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.772687584088999e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.981250433251262e-05, "sensitivity": 0.6230769116990666 }, { "name": "model.layers.22.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0223220670013689e-05, "sensitivity": 1.8400098608640456 }, { "name": "model.layers.22.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.79899960939656e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5586187954759225e-05, "sensitivity": 0.6163777853223603 }, { "name": "model.layers.22.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0049890988739207e-05, "sensitivity": 1.382525075042724 }, { "name": "model.layers.22.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.531098281608138e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006045112386345863, "sensitivity": 0.5260918517310695 }, { "name": "model.layers.22.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1164775060024112e-05, "sensitivity": 1.2392061189690793 }, { "name": "model.layers.22.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.935045687190723e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006962585030123591, "sensitivity": 0.5530764193845195 }, { "name": "model.layers.22.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2094356861780398e-05, "sensitivity": 1.9631615373680722 }, { "name": "model.layers.22.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.548454732386745e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007478423649445176, "sensitivity": 0.5237141572394394 }, { "name": "model.layers.22.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.992728256387636e-05, "sensitivity": 0.64283938750788 }, { "name": "model.layers.22.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.177745603963558e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006630040588788688, "sensitivity": 0.541999497275556 }, { "name": "model.layers.22.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.938087633694522e-05, "sensitivity": 0.7892617575982078 }, { "name": "model.layers.22.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.214918582576502e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006710853194817901, "sensitivity": 0.5315456830090102 }, { "name": "model.layers.22.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7212873798562214e-05, "sensitivity": 0.8748850829641914 }, { "name": "model.layers.22.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.666423809700063e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006374261574819684, "sensitivity": 0.5744315837111832 }, { "name": "model.layers.22.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8358309615869075e-05, "sensitivity": 0.7731973314491084 }, { "name": "model.layers.22.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.203564453244326e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006438556592911482, "sensitivity": 0.5181801839774159 }, { "name": "model.layers.22.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9135545598110184e-05, "sensitivity": 0.8112252112411666 }, { "name": "model.layers.22.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.650039037798706e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006629450945183635, "sensitivity": 0.5291117855717549 }, { "name": "model.layers.22.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0757581549114548e-05, "sensitivity": 1.2176652244739676 }, { "name": "model.layers.22.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.601946319686249e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006560278125107288, "sensitivity": 0.5503460601608802 }, { "name": "model.layers.22.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.809578578919172e-05, "sensitivity": 0.8802972772187485 }, { "name": "model.layers.22.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.908569503139006e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006448211497627199, "sensitivity": 0.5938683379514424 }, { "name": "model.layers.22.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.322897388599813e-05, "sensitivity": 0.8824782892315874 }, { "name": "model.layers.22.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.158184303079906e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007096983026713133, "sensitivity": 0.5131836444099749 }, { "name": "model.layers.22.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.736937600886449e-05, "sensitivity": 0.8296182816841178 }, { "name": "model.layers.22.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.96952759224223e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000636305776424706, "sensitivity": 0.5500020689377991 }, { "name": "model.layers.22.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0170171663048677e-05, "sensitivity": 1.4267925585460308 }, { "name": "model.layers.22.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.71945918181882e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006069838418625295, "sensitivity": 0.5343719803430172 }, { "name": "model.layers.22.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.199610652402043e-05, "sensitivity": 0.8666228868541752 }, { "name": "model.layers.22.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.611628234371892e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.004492752254009e-05, "sensitivity": 0.7627208579755788 }, { "name": "model.layers.22.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.651542207691818e-05, "sensitivity": 0.8795493610655879 }, { "name": "model.layers.22.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.479551413780428e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.834907981101424e-05, "sensitivity": 0.6009680495769741 }, { "name": "model.layers.22.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0361793101765215e-05, "sensitivity": 1.2828177540429133 }, { "name": "model.layers.22.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.962024710650439e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.705348667106591e-05, "sensitivity": 0.7234874118371908 }, { "name": "model.layers.22.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9844765928573906e-05, "sensitivity": 1.127527965254845 }, { "name": "model.layers.22.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.451617645732767e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006729811429977417, "sensitivity": 0.5333905595507623 }, { "name": "model.layers.22.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.822765524499118e-05, "sensitivity": 0.9899675928909057 }, { "name": "model.layers.22.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.752810458645399e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.816500197397545e-05, "sensitivity": 0.6585783460990875 }, { "name": "model.layers.22.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.903498822590336e-05, "sensitivity": 0.816956627817945 }, { "name": "model.layers.22.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.880795121513074e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006612031138502061, "sensitivity": 0.5298085308966607 }, { "name": "model.layers.22.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.589172360487282e-05, "sensitivity": 0.946710767029887 }, { "name": "model.layers.22.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.524612210043415e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006221960647962987, "sensitivity": 0.5574631066020017 }, { "name": "model.layers.22.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.457543349824846e-05, "sensitivity": 1.1364033967809295 }, { "name": "model.layers.22.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.841090786721907e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007323867175728083, "sensitivity": 0.5844849447142206 }, { "name": "model.layers.22.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.486240115715191e-05, "sensitivity": 1.0593538666636677 }, { "name": "model.layers.22.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.616864200419514e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006013004458509386, "sensitivity": 0.5385024622551718 }, { "name": "model.layers.22.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0558382200542837e-05, "sensitivity": 1.7843935135047038 }, { "name": "model.layers.22.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.327364184879116e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.594580579781905e-05, "sensitivity": 0.6761231227382877 }, { "name": "model.layers.22.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.824711115565151e-05, "sensitivity": 0.9158564102944027 }, { "name": "model.layers.22.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.272023706012988e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006438942509703338, "sensitivity": 0.563524588999176 }, { "name": "model.layers.22.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0486375686014071e-05, "sensitivity": 1.253854202281932 }, { "name": "model.layers.22.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.887993097530853e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006188774714246392, "sensitivity": 0.5775393408245677 }, { "name": "model.layers.22.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.140892618423095e-05, "sensitivity": 1.4771172986162353 }, { "name": "model.layers.22.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.235104817482352e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.844766565132886e-05, "sensitivity": 0.6902943360675445 }, { "name": "model.layers.22.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1369505045877304e-05, "sensitivity": 1.223487706050514 }, { "name": "model.layers.22.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.682168418592482e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000683480582665652, "sensitivity": 0.5142055952849968 }, { "name": "model.layers.22.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1346650353516452e-05, "sensitivity": 1.2080392934177522 }, { "name": "model.layers.22.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.482274557129131e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006929466035217047, "sensitivity": 0.5384676250720434 }, { "name": "model.layers.22.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0431626479839906e-05, "sensitivity": 0.7961475076026204 }, { "name": "model.layers.22.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.048578254398308e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.1097439710283652e-05, "sensitivity": 1.2150817957415367 }, { "name": "model.layers.22.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0472302720882e-05, "sensitivity": 0.7868762509615068 }, { "name": "model.layers.22.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2184758588773548e-06, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006675118347629905, "sensitivity": 0.5550824361880548 }, { "name": "model.layers.22.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.974400482955389e-05, "sensitivity": 0.8872055494691227 }, { "name": "model.layers.22.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.016169891154277e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8037428971147165e-05, "sensitivity": 0.6159250152935878 }, { "name": "model.layers.22.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0642168490448967e-05, "sensitivity": 1.7828401202531037 }, { "name": "model.layers.22.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0724006642703898e-06, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.63515568501316e-05, "sensitivity": 0.8935013505815995 }, { "name": "model.layers.22.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.656555342487991e-05, "sensitivity": 1.0456408203187184 }, { "name": "model.layers.22.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.021084585772769e-06, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00078695232514292, "sensitivity": 0.5863430661568206 }, { "name": "model.layers.22.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.89020928600803e-05, "sensitivity": 0.9534578861171656 }, { "name": "model.layers.22.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.9791244666485e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006519048474729061, "sensitivity": 0.5839464336355608 }, { "name": "model.layers.22.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0605544048303273e-05, "sensitivity": 1.4958930512609527 }, { "name": "model.layers.22.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.618017434651847e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7752062275540084e-05, "sensitivity": 0.6939942943588301 }, { "name": "model.layers.22.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1237374565098435e-05, "sensitivity": 1.314535137599238 }, { "name": "model.layers.22.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.37388211544021e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000686120125465095, "sensitivity": 0.5338432669317794 }, { "name": "model.layers.22.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.153186404844746e-05, "sensitivity": 0.8200776520695697 }, { "name": "model.layers.22.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.728510240667674e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006930383387953043, "sensitivity": 0.5129730418476924 }, { "name": "model.layers.22.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.799957943963818e-05, "sensitivity": 0.9908800571694502 }, { "name": "model.layers.22.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.267640509984631e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006350053008645773, "sensitivity": 0.5164301875345324 }, { "name": "model.layers.22.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.082585185940843e-05, "sensitivity": 1.6754269175694971 }, { "name": "model.layers.22.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.013651952547661e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.892355693504214e-05, "sensitivity": 0.7312412486972154 }, { "name": "model.layers.22.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.56390659767203e-05, "sensitivity": 0.8863351862902266 }, { "name": "model.layers.22.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.589617444456962e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006184853264130652, "sensitivity": 0.5051559251716705 }, { "name": "model.layers.22.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.885845429380424e-06, "sensitivity": 1.5075894270006305 }, { "name": "model.layers.22.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.500391466739529e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005972343496978283, "sensitivity": 0.537126667807763 }, { "name": "model.layers.22.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.338371192920022e-05, "sensitivity": 0.9436815487719153 }, { "name": "model.layers.22.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.395060043156263e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.1940802222816274e-05, "sensitivity": 0.708979275086528 }, { "name": "model.layers.22.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.732461042702198e-05, "sensitivity": 0.8955151414200511 }, { "name": "model.layers.22.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.632192359276814e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.989724352024496e-05, "sensitivity": 0.8226693272360504 }, { "name": "model.layers.22.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0563817340880632e-05, "sensitivity": 1.7494980889471252 }, { "name": "model.layers.22.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.028306410778896e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7864577684085816e-05, "sensitivity": 1.1591246934646517 }, { "name": "model.layers.22.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8767891459865496e-05, "sensitivity": 1.0017397619736792 }, { "name": "model.layers.22.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.561466190963984e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000665161176584661, "sensitivity": 0.5302874364624178 }, { "name": "model.layers.22.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0696282162098214e-05, "sensitivity": 0.6513029535247876 }, { "name": "model.layers.22.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.735765166216879e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006683942629024386, "sensitivity": 0.5555399238038377 }, { "name": "model.layers.22.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 3.8034768294892274e-06, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.46106242229871e-06, "sensitivity": 2.0996964644812257 }, { "name": "model.layers.22.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.044948577255127e-07, "sensitivity": 10.0 }, { "name": "model.layers.22.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 8.600967703387141e-06, "sensitivity": 1.6482784280074676 }, { "name": "model.layers.22.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 2.7693076845025644e-05, "sensitivity": 1.6086821538531093 }, { "name": "model.layers.22.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.0001773597177816555, "sensitivity": 0.9708254655408286 }, { "name": "model.layers.22.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.5107136277947575e-05, "sensitivity": 1.3416098007019635 }, { "name": "model.layers.22.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.886990038561635e-05, "sensitivity": 0.7131944384569984 }, { "name": "model.layers.22.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002624464686959982, "sensitivity": 0.7164823237599173 }, { "name": "model.layers.23.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0344770089432131e-05, "sensitivity": 1.5194623680602186 }, { "name": "model.layers.23.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.972101687097165e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6620057875989005e-05, "sensitivity": 0.8099467798314249 }, { "name": "model.layers.23.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.798436905024573e-05, "sensitivity": 1.1802072109247421 }, { "name": "model.layers.23.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.053737019508844e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006465916521847248, "sensitivity": 0.5407696985671706 }, { "name": "model.layers.23.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9053149016108364e-05, "sensitivity": 0.7798696515253496 }, { "name": "model.layers.23.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1584390904317843e-06, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.893657362321392e-05, "sensitivity": 0.7025216735954837 }, { "name": "model.layers.23.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.968369805486873e-05, "sensitivity": 0.6331506381337162 }, { "name": "model.layers.23.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.475256325051305e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.967367178527638e-05, "sensitivity": 0.6149050173845396 }, { "name": "model.layers.23.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.839138611918315e-05, "sensitivity": 0.7234902885809288 }, { "name": "model.layers.23.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.423817234870512e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000662479258608073, "sensitivity": 0.5315885651419796 }, { "name": "model.layers.23.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006731246830895543, "sensitivity": 0.5829385991034397 }, { "name": "model.layers.23.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.101388632690941e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006843781447969377, "sensitivity": 0.5459808695991265 }, { "name": "model.layers.23.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.465174374170601e-05, "sensitivity": 0.9254648759080065 }, { "name": "model.layers.23.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.437041631419561e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007354131666943431, "sensitivity": 0.5204560499137848 }, { "name": "model.layers.23.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8443845773581415e-05, "sensitivity": 0.6900153898584416 }, { "name": "model.layers.23.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.149862770143955e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000630149501375854, "sensitivity": 0.5449572336200611 }, { "name": "model.layers.23.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.855241761310026e-05, "sensitivity": 0.9740901538351319 }, { "name": "model.layers.23.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.223286502267001e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8324098063167185e-05, "sensitivity": 0.6907986423650871 }, { "name": "model.layers.23.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007308712229132652, "sensitivity": 0.5850234997915367 }, { "name": "model.layers.23.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.369010740556405e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007723450544290245, "sensitivity": 0.5584750705410588 }, { "name": "model.layers.23.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.163332727737725e-05, "sensitivity": 0.8090881845454014 }, { "name": "model.layers.23.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.593532013241202e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.331225449685007e-05, "sensitivity": 0.7615802767329417 }, { "name": "model.layers.23.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.735422018915415e-05, "sensitivity": 1.0389225779963935 }, { "name": "model.layers.23.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.076163572288351e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006445469916798174, "sensitivity": 0.547177579177943 }, { "name": "model.layers.23.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7498102250974625e-05, "sensitivity": 0.7202523338434988 }, { "name": "model.layers.23.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.572108190994186e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006437463453039527, "sensitivity": 0.5747571934558269 }, { "name": "model.layers.23.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1325179002596997e-05, "sensitivity": 1.987920095991545 }, { "name": "model.layers.23.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.974173286129371e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.054944242350757e-05, "sensitivity": 0.6512364315351131 }, { "name": "model.layers.23.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.734761361964047e-05, "sensitivity": 1.0387054651898644 }, { "name": "model.layers.23.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.376187116075016e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006259295041672885, "sensitivity": 0.5252295845267203 }, { "name": "model.layers.23.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.389809277607128e-05, "sensitivity": 0.6399782859720696 }, { "name": "model.layers.23.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.727535825732048e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.403546285582706e-05, "sensitivity": 0.7493024997693607 }, { "name": "model.layers.23.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6457327445968986e-05, "sensitivity": 0.6122299494613926 }, { "name": "model.layers.23.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0396089464848046e-06, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006270084413699806, "sensitivity": 0.5282887593032334 }, { "name": "model.layers.23.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.947591125732288e-05, "sensitivity": 0.9327136112730321 }, { "name": "model.layers.23.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.625344894928276e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006714216433465481, "sensitivity": 0.5854103474839663 }, { "name": "model.layers.23.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.689120345981792e-05, "sensitivity": 0.8182049723496883 }, { "name": "model.layers.23.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.007185445218056e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007574408082291484, "sensitivity": 0.5866569752687196 }, { "name": "model.layers.23.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1368038940418046e-05, "sensitivity": 1.5985122811774852 }, { "name": "model.layers.23.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.825770123621623e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.071916868677363e-05, "sensitivity": 0.7154548556375024 }, { "name": "model.layers.23.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.845763371326029e-05, "sensitivity": 0.6326880284135424 }, { "name": "model.layers.23.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.976515234986437e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7839024520944804e-05, "sensitivity": 0.9150978326954551 }, { "name": "model.layers.23.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006567409145645797, "sensitivity": 0.5703766354537058 }, { "name": "model.layers.23.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.988771244527015e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006348647875711322, "sensitivity": 0.5657077060360924 }, { "name": "model.layers.23.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0848302382510155e-05, "sensitivity": 0.7985769552937871 }, { "name": "model.layers.23.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.878710223645612e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006547847297042608, "sensitivity": 0.5406073092503514 }, { "name": "model.layers.23.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0666908565326594e-05, "sensitivity": 1.7568588880858418 }, { "name": "model.layers.23.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.991151053625799e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006521636387333274, "sensitivity": 0.545379176901954 }, { "name": "model.layers.23.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9881331253563985e-05, "sensitivity": 1.0899271601975011 }, { "name": "model.layers.23.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.40544123800646e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006692990427836776, "sensitivity": 0.5494588937905218 }, { "name": "model.layers.23.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.879232776351273e-05, "sensitivity": 0.8106012695415316 }, { "name": "model.layers.23.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.295632033470611e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006546465447172523, "sensitivity": 0.5308143932456463 }, { "name": "model.layers.23.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7730834669200704e-05, "sensitivity": 0.8455102166877334 }, { "name": "model.layers.23.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.560132300772239e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.407911885413341e-05, "sensitivity": 0.6459628123871882 }, { "name": "model.layers.23.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.408502667909488e-05, "sensitivity": 0.7391221263922982 }, { "name": "model.layers.23.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.891662789916154e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.435107934521511e-05, "sensitivity": 0.7727401931709401 }, { "name": "model.layers.23.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1191611520189326e-05, "sensitivity": 1.701589804272902 }, { "name": "model.layers.23.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.59958197704691e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0106754972366616e-05, "sensitivity": 0.6283119387103795 }, { "name": "model.layers.23.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.551648064283654e-05, "sensitivity": 0.9535833665992497 }, { "name": "model.layers.23.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.50962419967982e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006053246324881911, "sensitivity": 0.5258176047548305 }, { "name": "model.layers.23.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.295957427937537e-05, "sensitivity": 0.7311575489518543 }, { "name": "model.layers.23.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.713862709759269e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007193150813691318, "sensitivity": 0.5742119652763369 }, { "name": "model.layers.23.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.042717723175883e-05, "sensitivity": 0.9414144913039996 }, { "name": "model.layers.23.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.212848001676321e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.012164521962404e-05, "sensitivity": 0.6178189584342826 }, { "name": "model.layers.23.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0573603503871709e-05, "sensitivity": 1.4148434419702227 }, { "name": "model.layers.23.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.089459247959894e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006368387257680297, "sensitivity": 0.5225359640847094 }, { "name": "model.layers.23.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.935625813435763e-05, "sensitivity": 0.6747077547165619 }, { "name": "model.layers.23.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.542618050138117e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006606288952752948, "sensitivity": 0.5473435111469347 }, { "name": "model.layers.23.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.404926534742117e-05, "sensitivity": 0.8899763051698821 }, { "name": "model.layers.23.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.671967179907369e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.300906534306705e-05, "sensitivity": 0.600380698401833 }, { "name": "model.layers.23.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.015099279466085e-05, "sensitivity": 0.816960628129437 }, { "name": "model.layers.23.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.472411655522592e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006699608638882637, "sensitivity": 0.5821121422874357 }, { "name": "model.layers.23.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.389273792388849e-05, "sensitivity": 0.6313974277669374 }, { "name": "model.layers.23.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.976168040433549e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006152235437184572, "sensitivity": 0.586383065151956 }, { "name": "model.layers.23.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.399668200174347e-05, "sensitivity": 0.9940653674707804 }, { "name": "model.layers.23.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.917273023849702e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007643412100151181, "sensitivity": 0.5771344490527444 }, { "name": "model.layers.23.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0907485375355463e-05, "sensitivity": 1.4598568322800671 }, { "name": "model.layers.23.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.800564046396175e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5692315072519705e-05, "sensitivity": 0.7275793084576685 }, { "name": "model.layers.23.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.083292464609258e-05, "sensitivity": 1.1272612840394125 }, { "name": "model.layers.23.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.126334023472737e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.181707431096584e-05, "sensitivity": 0.8710483636421799 }, { "name": "model.layers.23.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.230451253941283e-05, "sensitivity": 0.8364537727195583 }, { "name": "model.layers.23.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.395862778343144e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007110959850251675, "sensitivity": 0.5194094661328419 }, { "name": "model.layers.23.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1245319001318421e-05, "sensitivity": 1.3832111206010302 }, { "name": "model.layers.23.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.473218369748793e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006979455938562751, "sensitivity": 0.5748708793533971 }, { "name": "model.layers.23.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.201693759066984e-05, "sensitivity": 1.1494530558457474 }, { "name": "model.layers.23.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.804853001085576e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006895688129588962, "sensitivity": 0.5954026503269555 }, { "name": "model.layers.23.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.206110573548358e-05, "sensitivity": 1.4599017219590174 }, { "name": "model.layers.23.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.246200781679363e-06, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.551800470333546e-05, "sensitivity": 0.8261366257562447 }, { "name": "model.layers.23.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0060684871859848e-05, "sensitivity": 1.9725452279880398 }, { "name": "model.layers.23.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.311898914646008e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.208549555391073e-05, "sensitivity": 0.6794733054360207 }, { "name": "model.layers.23.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.904023419134319e-05, "sensitivity": 0.8533573873948748 }, { "name": "model.layers.23.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.429813765862491e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006444841856136918, "sensitivity": 0.5407334537006119 }, { "name": "model.layers.23.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.47583622392267e-05, "sensitivity": 1.0912380550073626 }, { "name": "model.layers.23.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.69008784370817e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006082548061385751, "sensitivity": 0.5270244483420728 }, { "name": "model.layers.23.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.762826185673475e-05, "sensitivity": 1.1961303692694545 }, { "name": "model.layers.23.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.276253649659338e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006592716090381145, "sensitivity": 0.5635429416214035 }, { "name": "model.layers.23.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1133539373986423e-05, "sensitivity": 1.608687981314394 }, { "name": "model.layers.23.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.016695798891305e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.116547592682764e-05, "sensitivity": 0.6310444527648402 }, { "name": "model.layers.23.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.060164014343172e-05, "sensitivity": 0.9353490282968993 }, { "name": "model.layers.23.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.526051604145323e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000683646067045629, "sensitivity": 0.5494155797572733 }, { "name": "model.layers.23.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.790566501673311e-05, "sensitivity": 0.7976481127560685 }, { "name": "model.layers.23.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.688896974083036e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.765180685557425e-05, "sensitivity": 0.7379909246330951 }, { "name": "model.layers.23.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.364659591577947e-05, "sensitivity": 0.8815622405654898 }, { "name": "model.layers.23.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.26893574665155e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.198080907575786e-05, "sensitivity": 0.9165106798231014 }, { "name": "model.layers.23.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7623656175564975e-05, "sensitivity": 0.7959622603557931 }, { "name": "model.layers.23.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.85663758051669e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006553898565471172, "sensitivity": 0.5240360123057535 }, { "name": "model.layers.23.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0623715752444696e-05, "sensitivity": 1.5529395909487436 }, { "name": "model.layers.23.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.937719033179746e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.827764834975824e-05, "sensitivity": 0.9891454583356069 }, { "name": "model.layers.23.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.022103480063379e-05, "sensitivity": 1.1310886239630578 }, { "name": "model.layers.23.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2074810911144596e-06, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.134886643849313e-05, "sensitivity": 0.9520962296511072 }, { "name": "model.layers.23.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.787921691080555e-05, "sensitivity": 0.7542097835251735 }, { "name": "model.layers.23.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.574249932280509e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000647238630335778, "sensitivity": 0.5362168616936781 }, { "name": "model.layers.23.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6341232266277075e-05, "sensitivity": 0.9510503105197246 }, { "name": "model.layers.23.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.251464921864681e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000620881502982229, "sensitivity": 0.5878523916127308 }, { "name": "model.layers.23.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.860783130628988e-05, "sensitivity": 0.8261243888233641 }, { "name": "model.layers.23.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.001381507303449e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006395687814801931, "sensitivity": 0.5221573542942948 }, { "name": "model.layers.23.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.502608837559819e-05, "sensitivity": 0.9753307117944833 }, { "name": "model.layers.23.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.92521814724023e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.355502071324736e-05, "sensitivity": 0.6257292339431655 }, { "name": "model.layers.23.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.149370165076107e-05, "sensitivity": 0.9846719403853545 }, { "name": "model.layers.23.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.392737870759447e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006734089693054557, "sensitivity": 0.5861094716957109 }, { "name": "model.layers.23.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8694975450634956e-05, "sensitivity": 0.6419246145981509 }, { "name": "model.layers.23.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.034480967784475e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00066488201264292, "sensitivity": 0.5452565258251397 }, { "name": "model.layers.23.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.439764547394589e-05, "sensitivity": 1.0333184529058272 }, { "name": "model.layers.23.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.722758479962067e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007382944459095597, "sensitivity": 0.5452297900109437 }, { "name": "model.layers.23.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.637526530539617e-05, "sensitivity": 1.0154652424565567 }, { "name": "model.layers.23.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.62149170441262e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.713804032187909e-05, "sensitivity": 0.6738393318943545 }, { "name": "model.layers.23.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.69842777622398e-05, "sensitivity": 1.1432429899809091 }, { "name": "model.layers.23.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.54938844490971e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006202874938026071, "sensitivity": 0.5134257167038849 }, { "name": "model.layers.23.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 4.106113010493573e-06, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.584149665897712e-06, "sensitivity": 1.9805164116591907 }, { "name": "model.layers.23.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.770854265094385e-07, "sensitivity": 10.0 }, { "name": "model.layers.23.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 2.115526285706437e-06, "sensitivity": 2.103942094838983 }, { "name": "model.layers.23.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 6.459436917793937e-06, "sensitivity": 2.001088489728363 }, { "name": "model.layers.23.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00016866796067915857, "sensitivity": 0.9043927123252187 }, { "name": "model.layers.23.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.3943327758170199e-05, "sensitivity": 0.9641423448274783 }, { "name": "model.layers.23.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 4, "mse": 1.1663777513604145e-05, "sensitivity": 1.4523839266687488 }, { "name": "model.layers.23.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.000247941876295954, "sensitivity": 0.7656354394975902 }, { "name": "model.layers.24.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3101101760403253e-06, "sensitivity": 2.097498756429942 }, { "name": "model.layers.24.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.166096788248979e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006460563745349646, "sensitivity": 0.5822346385488447 }, { "name": "model.layers.24.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.239144568098709e-05, "sensitivity": 0.8419268987271631 }, { "name": "model.layers.24.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.13512577021902e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000701237004250288, "sensitivity": 0.5340104688834474 }, { "name": "model.layers.24.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.567063271882944e-05, "sensitivity": 1.075776186682438 }, { "name": "model.layers.24.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0221291404377553e-06, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.724414222640917e-05, "sensitivity": 0.6238970051273653 }, { "name": "model.layers.24.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1388836355763488e-05, "sensitivity": 1.476937638234124 }, { "name": "model.layers.24.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.754909804840281e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7280045439256355e-05, "sensitivity": 0.7365326791978575 }, { "name": "model.layers.24.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8917197748087347e-05, "sensitivity": 0.7919049149805171 }, { "name": "model.layers.24.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.225620268196508e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006562242051586509, "sensitivity": 0.5502417761636298 }, { "name": "model.layers.24.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.126459629740566e-05, "sensitivity": 0.9411614469465197 }, { "name": "model.layers.24.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.313999847407104e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006796446396037936, "sensitivity": 0.5583067123761776 }, { "name": "model.layers.24.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.104196654632688e-05, "sensitivity": 0.6808956853384065 }, { "name": "model.layers.24.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.528709483674902e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.141296762507409e-05, "sensitivity": 0.6052810448423196 }, { "name": "model.layers.24.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.881843728478998e-05, "sensitivity": 1.0969884890372692 }, { "name": "model.layers.24.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.527338988846168e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.026315142866224e-05, "sensitivity": 0.7505424705024761 }, { "name": "model.layers.24.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.19579732301645e-05, "sensitivity": 0.7653969001937377 }, { "name": "model.layers.24.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.451030109630665e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.180327909532934e-05, "sensitivity": 0.62838929593993 }, { "name": "model.layers.24.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.19618222117424e-05, "sensitivity": 0.9536534773642711 }, { "name": "model.layers.24.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.862980737627367e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000681792851537466, "sensitivity": 0.5121415048969691 }, { "name": "model.layers.24.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.377277951381984e-06, "sensitivity": 2.0971398448596315 }, { "name": "model.layers.24.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.087228712203796e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.637483991449699e-05, "sensitivity": 0.8367330787007305 }, { "name": "model.layers.24.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006845964817330241, "sensitivity": 0.5788298693710906 }, { "name": "model.layers.24.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.739252285115072e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006864133174531162, "sensitivity": 0.5247952235783319 }, { "name": "model.layers.24.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.281426612986252e-05, "sensitivity": 0.9186774728603584 }, { "name": "model.layers.24.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0829402299350477e-06, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.345783185679466e-05, "sensitivity": 0.6500530527072678 }, { "name": "model.layers.24.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.098053326131776e-05, "sensitivity": 1.7576605422890417 }, { "name": "model.layers.24.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.737512982610497e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8556739531923085e-05, "sensitivity": 0.7566216553860602 }, { "name": "model.layers.24.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.182257493492216e-05, "sensitivity": 1.124029333124639 }, { "name": "model.layers.24.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.221560960919305e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.27022236585617e-05, "sensitivity": 0.729859516950556 }, { "name": "model.layers.24.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.990046702208929e-05, "sensitivity": 0.6712516084924582 }, { "name": "model.layers.24.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.412969580400386e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006706073763780296, "sensitivity": 0.5697078914955702 }, { "name": "model.layers.24.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9829482779605314e-05, "sensitivity": 0.6399838696236848 }, { "name": "model.layers.24.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.75678017816972e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000674064620397985, "sensitivity": 0.5503889236785967 }, { "name": "model.layers.24.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.074592728400603e-05, "sensitivity": 1.210066734533182 }, { "name": "model.layers.24.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.96288122223632e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.016989209456369e-05, "sensitivity": 0.6042026914884189 }, { "name": "model.layers.24.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.23895030003041e-05, "sensitivity": 1.1950439471455778 }, { "name": "model.layers.24.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.630090976817883e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000698382849805057, "sensitivity": 0.541293369645206 }, { "name": "model.layers.24.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.3548818060371559e-05, "sensitivity": 1.313149006493195 }, { "name": "model.layers.24.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.878849490021821e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.107302371878177e-05, "sensitivity": 0.8574388053014641 }, { "name": "model.layers.24.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3835850849281996e-05, "sensitivity": 1.1365424828827473 }, { "name": "model.layers.24.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.402996758770314e-06, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.535260424949229e-05, "sensitivity": 0.8371759659242822 }, { "name": "model.layers.24.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.898263771086931e-05, "sensitivity": 0.9113514334100313 }, { "name": "model.layers.24.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2283056776141166e-06, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.922736818320118e-05, "sensitivity": 0.8874386103524159 }, { "name": "model.layers.24.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0770268090709578e-05, "sensitivity": 1.4570369457867736 }, { "name": "model.layers.24.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.33263994131994e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006285202107392251, "sensitivity": 0.5741495354073028 }, { "name": "model.layers.24.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1003145118593238e-05, "sensitivity": 1.212075173725774 }, { "name": "model.layers.24.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.576364507462131e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000683597638271749, "sensitivity": 0.5649832509339734 }, { "name": "model.layers.24.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.065877586370334e-05, "sensitivity": 1.2804553872179476 }, { "name": "model.layers.24.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.69165853348386e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006455188849940896, "sensitivity": 0.527263069237397 }, { "name": "model.layers.24.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.38758938293904e-05, "sensitivity": 0.9701758806713681 }, { "name": "model.layers.24.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.689635594942956e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007257977849803865, "sensitivity": 0.5575498435728026 }, { "name": "model.layers.24.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.379558180924505e-05, "sensitivity": 0.633479862693713 }, { "name": "model.layers.24.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.006500138435513e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.424727325793356e-05, "sensitivity": 0.6211253468110328 }, { "name": "model.layers.24.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0721246326284017e-05, "sensitivity": 1.3518969577954791 }, { "name": "model.layers.24.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.301311827883183e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006434733513742685, "sensitivity": 0.5483611292361205 }, { "name": "model.layers.24.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7765544624999166e-05, "sensitivity": 0.9530281586620297 }, { "name": "model.layers.24.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.962465934317152e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000654479255899787, "sensitivity": 0.558429611734185 }, { "name": "model.layers.24.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.293647311395034e-05, "sensitivity": 0.6824504092662931 }, { "name": "model.layers.24.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.2765277536746e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.308119191089645e-05, "sensitivity": 0.6473609417607884 }, { "name": "model.layers.24.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.230151484487578e-05, "sensitivity": 0.786045035999273 }, { "name": "model.layers.24.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.578475222340785e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.253697210922837e-05, "sensitivity": 0.634445163643696 }, { "name": "model.layers.24.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6325672630919144e-05, "sensitivity": 1.1053331657455396 }, { "name": "model.layers.24.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.854134315086412e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006331233307719231, "sensitivity": 0.5400867067219166 }, { "name": "model.layers.24.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0735990144894458e-05, "sensitivity": 1.8083117699560873 }, { "name": "model.layers.24.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.506873900325445e-06, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.502840940607712e-05, "sensitivity": 0.9100078257138581 }, { "name": "model.layers.24.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.868079460924491e-05, "sensitivity": 1.0494545958969714 }, { "name": "model.layers.24.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.619117579655722e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006558973109349608, "sensitivity": 0.5810709301784469 }, { "name": "model.layers.24.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0673756150936242e-05, "sensitivity": 1.2066349701065369 }, { "name": "model.layers.24.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.823955456842668e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006472342065535486, "sensitivity": 0.5521608515462972 }, { "name": "model.layers.24.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.036263584974222e-05, "sensitivity": 0.994337588321382 }, { "name": "model.layers.24.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.74975967235514e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.867867366760038e-05, "sensitivity": 0.753702432917827 }, { "name": "model.layers.24.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0582649894058704e-05, "sensitivity": 0.9633664550910637 }, { "name": "model.layers.24.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.676191557948187e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000666131149046123, "sensitivity": 0.5609909368165344 }, { "name": "model.layers.24.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.99828599661123e-05, "sensitivity": 0.9996903616095623 }, { "name": "model.layers.24.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.510273919957399e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006490254309028387, "sensitivity": 0.5806831536599573 }, { "name": "model.layers.24.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.116055737948045e-05, "sensitivity": 1.1638283119288924 }, { "name": "model.layers.24.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.127702812998905e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006891604280099273, "sensitivity": 0.5283744765108511 }, { "name": "model.layers.24.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0957405720546376e-05, "sensitivity": 1.2149797354096572 }, { "name": "model.layers.24.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.181051842053421e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006686467677354813, "sensitivity": 0.5618212514991637 }, { "name": "model.layers.24.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7066205044975504e-05, "sensitivity": 1.1126727803095082 }, { "name": "model.layers.24.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.40406107979652e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.587047780863941e-05, "sensitivity": 0.729550181187613 }, { "name": "model.layers.24.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0730101166700479e-05, "sensitivity": 1.4753435243166644 }, { "name": "model.layers.24.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3472138107317733e-06, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.415573104983196e-05, "sensitivity": 0.9960226837431138 }, { "name": "model.layers.24.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.990861609461717e-05, "sensitivity": 1.1485472508698686 }, { "name": "model.layers.24.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.694502528465819e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8173289289698005e-05, "sensitivity": 0.6306223194539833 }, { "name": "model.layers.24.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0163108527194709e-05, "sensitivity": 1.599964894251045 }, { "name": "model.layers.24.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.050348702046904e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.4562664445256814e-05, "sensitivity": 0.6166827874974443 }, { "name": "model.layers.24.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.822442108183168e-05, "sensitivity": 1.1979137493980454 }, { "name": "model.layers.24.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.319021395029267e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006293452461250126, "sensitivity": 0.5243806543341578 }, { "name": "model.layers.24.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.056778511265293e-05, "sensitivity": 0.6298051871574949 }, { "name": "model.layers.24.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.083143600539188e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006835462991148233, "sensitivity": 0.551135456602543 }, { "name": "model.layers.24.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.124116352002602e-05, "sensitivity": 1.212751631181938 }, { "name": "model.layers.24.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2752592510878458e-06, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.897781375097111e-05, "sensitivity": 0.9952740060659527 }, { "name": "model.layers.24.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.248210411285982e-05, "sensitivity": 0.7748557148522042 }, { "name": "model.layers.24.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.206530542840483e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006776286172680557, "sensitivity": 0.5538494671792241 }, { "name": "model.layers.24.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0782484423543792e-05, "sensitivity": 1.4106850234790977 }, { "name": "model.layers.24.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.655869123685989e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006525579374283552, "sensitivity": 0.5842808944356076 }, { "name": "model.layers.24.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3476841306546703e-06, "sensitivity": 2.0972166832124017 }, { "name": "model.layers.24.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.907204573915806e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.486647569341585e-05, "sensitivity": 0.8810614361555321 }, { "name": "model.layers.24.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.780210242141038e-05, "sensitivity": 1.0335258205273472 }, { "name": "model.layers.24.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.420611490895681e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.889079668326303e-05, "sensitivity": 0.6305333402819896 }, { "name": "model.layers.24.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.912439519306645e-05, "sensitivity": 0.9605757333577826 }, { "name": "model.layers.24.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.538449947081972e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006573281134478748, "sensitivity": 0.5604943414586883 }, { "name": "model.layers.24.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7212859246646985e-05, "sensitivity": 0.8346824688577925 }, { "name": "model.layers.24.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.99485405877931e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5804059229558334e-05, "sensitivity": 0.6300873937943311 }, { "name": "model.layers.24.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.263878458412364e-05, "sensitivity": 0.939136365055999 }, { "name": "model.layers.24.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.99798340772395e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006797324167564511, "sensitivity": 0.5515761717323965 }, { "name": "model.layers.24.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.742678669979796e-05, "sensitivity": 0.7200637523853529 }, { "name": "model.layers.24.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.808769962342922e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007576106581836939, "sensitivity": 0.5590005969124842 }, { "name": "model.layers.24.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0697312063712161e-05, "sensitivity": 1.3295917516081444 }, { "name": "model.layers.24.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.167903047251457e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000635925680398941, "sensitivity": 0.5942573439408205 }, { "name": "model.layers.24.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1199506843695417e-05, "sensitivity": 1.3092014527289029 }, { "name": "model.layers.24.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3899286841478897e-06, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9886235248995945e-05, "sensitivity": 0.7095641792791587 }, { "name": "model.layers.24.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.664139098371379e-05, "sensitivity": 0.8571310282777946 }, { "name": "model.layers.24.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.193651410692837e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.529048212338239e-05, "sensitivity": 0.684190293664042 }, { "name": "model.layers.24.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.004059105180204e-05, "sensitivity": 0.7645255779930702 }, { "name": "model.layers.24.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.306298582283489e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006880129221826792, "sensitivity": 0.5387919632290868 }, { "name": "model.layers.24.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.230159488040954e-05, "sensitivity": 0.9156547575545235 }, { "name": "model.layers.24.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0040537290478824e-06, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.1015598475933075e-05, "sensitivity": 0.6049721614116705 }, { "name": "model.layers.24.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.245731436938513e-05, "sensitivity": 1.4419565248472832 }, { "name": "model.layers.24.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.423937967767415e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.96554416208528e-05, "sensitivity": 0.8734700975680405 }, { "name": "model.layers.24.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.199470954015851e-05, "sensitivity": 1.0667263595542007 }, { "name": "model.layers.24.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.628411028941628e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006832791259512305, "sensitivity": 0.5470922012191087 }, { "name": "model.layers.24.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.935063381912187e-05, "sensitivity": 0.9619607620254229 }, { "name": "model.layers.24.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.941553121781908e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006706849671900272, "sensitivity": 0.5213310164468583 }, { "name": "model.layers.24.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.600825872737914e-05, "sensitivity": 1.1744746305933358 }, { "name": "model.layers.24.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.518222784914542e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007472659926861525, "sensitivity": 0.5589237175330197 }, { "name": "model.layers.24.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 3.871424269163981e-06, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4003320504562e-06, "sensitivity": 2.101964718526645 }, { "name": "model.layers.24.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.987067990849027e-07, "sensitivity": 10.0 }, { "name": "model.layers.24.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 8.952685675467364e-06, "sensitivity": 1.2515614607251746 }, { "name": "model.layers.24.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 7.875893061282113e-06, "sensitivity": 2.052384444753904 }, { "name": "model.layers.24.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.0001954666804522276, "sensitivity": 0.9159879468535314 }, { "name": "model.layers.24.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.7538728570798412e-05, "sensitivity": 1.1713133590626483 }, { "name": "model.layers.24.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.7663171901367605e-05, "sensitivity": 0.7101762420091022 }, { "name": "model.layers.24.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003041939053218812, "sensitivity": 1.126339760991559 }, { "name": "model.layers.25.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.286647112574428e-05, "sensitivity": 0.8471455667954055 }, { "name": "model.layers.25.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.872229955159128e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0540995036717504e-05, "sensitivity": 0.6585349612688559 }, { "name": "model.layers.25.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.573334394488484e-05, "sensitivity": 1.128326478689371 }, { "name": "model.layers.25.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3334578170542954e-06, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007252152427099645, "sensitivity": 0.5970338713902094 }, { "name": "model.layers.25.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0478672821773216e-05, "sensitivity": 0.8327409166793602 }, { "name": "model.layers.25.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.957023851507984e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.921353294979781e-05, "sensitivity": 0.6685693729671394 }, { "name": "model.layers.25.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.455922266468406e-05, "sensitivity": 1.1424972387905736 }, { "name": "model.layers.25.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.580217354392516e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000713277782779187, "sensitivity": 0.5342946284060676 }, { "name": "model.layers.25.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.12496369285509e-05, "sensitivity": 0.8183668681277728 }, { "name": "model.layers.25.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.037155569378228e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006749966996721923, "sensitivity": 0.5563694217435456 }, { "name": "model.layers.25.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.359109829645604e-05, "sensitivity": 0.7873669092763788 }, { "name": "model.layers.25.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.262935580205522e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007152028265409172, "sensitivity": 0.5471079440340603 }, { "name": "model.layers.25.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0791198292281479e-05, "sensitivity": 1.3551873658872342 }, { "name": "model.layers.25.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.332358791245497e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006213188753463328, "sensitivity": 0.57077612676805 }, { "name": "model.layers.25.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.622391472570598e-05, "sensitivity": 1.0631425516212347 }, { "name": "model.layers.25.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.76281308894977e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006373782525770366, "sensitivity": 0.5644439969292463 }, { "name": "model.layers.25.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.963730265852064e-05, "sensitivity": 1.011722056180368 }, { "name": "model.layers.25.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.297167823911877e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007766250055283308, "sensitivity": 0.5763564746278718 }, { "name": "model.layers.25.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2678750863415189e-05, "sensitivity": 1.5744290919975377 }, { "name": "model.layers.25.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.702806439941924e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007705413154326379, "sensitivity": 0.5658629794046814 }, { "name": "model.layers.25.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0460577868798282e-05, "sensitivity": 1.4612759304469225 }, { "name": "model.layers.25.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.496520879612945e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006131215486675501, "sensitivity": 0.5403102176327339 }, { "name": "model.layers.25.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.222935917321593e-05, "sensitivity": 0.6817713486929649 }, { "name": "model.layers.25.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.961325880183722e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006979592144489288, "sensitivity": 0.5427507159965238 }, { "name": "model.layers.25.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.31205621175468e-05, "sensitivity": 0.9853243058463192 }, { "name": "model.layers.25.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.149782158601738e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.365451554302126e-05, "sensitivity": 0.6584945790971879 }, { "name": "model.layers.25.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.557085725944489e-05, "sensitivity": 0.8987599042721266 }, { "name": "model.layers.25.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.744257348145766e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007361824973486364, "sensitivity": 0.5096820129944093 }, { "name": "model.layers.25.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1074920621467754e-05, "sensitivity": 1.2169612408709582 }, { "name": "model.layers.25.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.981093403941486e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006461696466431022, "sensitivity": 0.5621877421279358 }, { "name": "model.layers.25.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.434924580389634e-05, "sensitivity": 0.6857082110218493 }, { "name": "model.layers.25.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.919032896097633e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007239067927002907, "sensitivity": 0.5188313159768583 }, { "name": "model.layers.25.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.11235445830971e-05, "sensitivity": 1.007237311494825 }, { "name": "model.layers.25.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.790399993406027e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006891667726449668, "sensitivity": 0.554976936153453 }, { "name": "model.layers.25.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.647338159382343e-05, "sensitivity": 0.9451881267784535 }, { "name": "model.layers.25.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.924977580842096e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007526649860665202, "sensitivity": 0.5879442045453436 }, { "name": "model.layers.25.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.337511538527906e-05, "sensitivity": 0.91672442654447 }, { "name": "model.layers.25.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.092075975378975e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.2231320296414196e-05, "sensitivity": 0.624316215100591 }, { "name": "model.layers.25.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.300158565863967e-05, "sensitivity": 1.1026023513859604 }, { "name": "model.layers.25.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3727953955822159e-06, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007415349828079343, "sensitivity": 0.5923834468009153 }, { "name": "model.layers.25.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9549092839006335e-05, "sensitivity": 0.6840087995677124 }, { "name": "model.layers.25.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.096685633063316e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006694148178212345, "sensitivity": 0.5341707799588546 }, { "name": "model.layers.25.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006697954377159476, "sensitivity": 0.5848955975805095 }, { "name": "model.layers.25.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.628990488228737e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006618675542995334, "sensitivity": 0.5440968932469578 }, { "name": "model.layers.25.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.796727418783121e-05, "sensitivity": 0.8853917652776598 }, { "name": "model.layers.25.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.437384172386373e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006296419887803495, "sensitivity": 0.5651341927498922 }, { "name": "model.layers.25.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9863243222935125e-05, "sensitivity": 0.9294461627357892 }, { "name": "model.layers.25.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.530850669150823e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006784807774238288, "sensitivity": 0.5029326532326508 }, { "name": "model.layers.25.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.7675014280248433e-06, "sensitivity": 2.0978637382936043 }, { "name": "model.layers.25.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1973803566434071e-06, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.702878115698695e-05, "sensitivity": 0.9690958048197583 }, { "name": "model.layers.25.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4322214358107885e-06, "sensitivity": 2.0974161851797506 }, { "name": "model.layers.25.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.109196644705662e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006256903288885951, "sensitivity": 0.5683746300321879 }, { "name": "model.layers.25.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.042145469109528e-05, "sensitivity": 1.1862684309028797 }, { "name": "model.layers.25.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.639827567298198e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006715126219205558, "sensitivity": 0.5770297128297731 }, { "name": "model.layers.25.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1826191439467948e-05, "sensitivity": 1.2708028899879098 }, { "name": "model.layers.25.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.918103281350341e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007063332013785839, "sensitivity": 0.5500600021803825 }, { "name": "model.layers.25.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9420923207653686e-05, "sensitivity": 1.0949579106828966 }, { "name": "model.layers.25.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.541110562669928e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.889019666938111e-05, "sensitivity": 0.788751412502666 }, { "name": "model.layers.25.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2414244338287972e-05, "sensitivity": 1.3477447019808597 }, { "name": "model.layers.25.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0329163160349708e-06, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.794578803237528e-05, "sensitivity": 0.7557453314070244 }, { "name": "model.layers.25.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7458324590697885e-05, "sensitivity": 1.0266821943370958 }, { "name": "model.layers.25.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.072519340705185e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006467581260949373, "sensitivity": 0.5230792312805237 }, { "name": "model.layers.25.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.516865687444806e-05, "sensitivity": 0.7404344050137536 }, { "name": "model.layers.25.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.505211669922573e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007447988609783351, "sensitivity": 0.5306202899400626 }, { "name": "model.layers.25.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0121468221768737e-05, "sensitivity": 1.9109391866083592 }, { "name": "model.layers.25.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.631268891193031e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.468084054882638e-05, "sensitivity": 0.6531271462115653 }, { "name": "model.layers.25.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8144269132753834e-05, "sensitivity": 0.8232349463579154 }, { "name": "model.layers.25.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.487388759524038e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006441447767429054, "sensitivity": 0.5401508475229917 }, { "name": "model.layers.25.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.063318141968921e-05, "sensitivity": 1.1354171190244817 }, { "name": "model.layers.25.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.367643999918073e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000668938853777945, "sensitivity": 0.5718355543051027 }, { "name": "model.layers.25.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.258355278987437e-05, "sensitivity": 0.8093694569195755 }, { "name": "model.layers.25.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.359757094287488e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006977439625188708, "sensitivity": 0.5252835715037875 }, { "name": "model.layers.25.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.911683547310531e-05, "sensitivity": 0.7730472237933786 }, { "name": "model.layers.25.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.601362881359819e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000648645160254091, "sensitivity": 0.526662005956213 }, { "name": "model.layers.25.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.6218308347743e-05, "sensitivity": 0.9470506699484725 }, { "name": "model.layers.25.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.834588243189501e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.557442247867584e-05, "sensitivity": 0.7874369602931846 }, { "name": "model.layers.25.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8136363804806024e-05, "sensitivity": 0.9714307034032273 }, { "name": "model.layers.25.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.781023103030748e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006237979396246374, "sensitivity": 0.5588348675745913 }, { "name": "model.layers.25.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.400638812920079e-05, "sensitivity": 0.6705446522226461 }, { "name": "model.layers.25.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.34069260488468e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007089774007909, "sensitivity": 0.5283967094688902 }, { "name": "model.layers.25.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.907401646254584e-05, "sensitivity": 0.8378535603218288 }, { "name": "model.layers.25.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.26877260603942e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006374302320182323, "sensitivity": 0.5227986745868392 }, { "name": "model.layers.25.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1679816452669911e-05, "sensitivity": 1.6965336981590313 }, { "name": "model.layers.25.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.044552618623129e-06, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.039203071850352e-05, "sensitivity": 0.663138489943017 }, { "name": "model.layers.25.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.849884473718703e-05, "sensitivity": 1.0152064993128305 }, { "name": "model.layers.25.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.248533281905111e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006589896511286497, "sensitivity": 0.5410411702998772 }, { "name": "model.layers.25.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.337130616884679e-05, "sensitivity": 0.854042851828322 }, { "name": "model.layers.25.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.681322588519834e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000716469599865377, "sensitivity": 0.5239112077287971 }, { "name": "model.layers.25.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.162043428048491e-05, "sensitivity": 1.0059627554488983 }, { "name": "model.layers.25.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.618364179506898e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.829898873344064e-05, "sensitivity": 0.7489536608692579 }, { "name": "model.layers.25.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1912498848687392e-05, "sensitivity": 1.2104026613334729 }, { "name": "model.layers.25.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0199846656178124e-06, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007224151631817222, "sensitivity": 0.540130739219115 }, { "name": "model.layers.25.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.623871740885079e-05, "sensitivity": 1.1235654188204687 }, { "name": "model.layers.25.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.463877409463748e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007401038310490549, "sensitivity": 0.5518693758939852 }, { "name": "model.layers.25.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0035367267846595e-05, "sensitivity": 1.354559530513249 }, { "name": "model.layers.25.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.783334356441628e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005940498667769134, "sensitivity": 0.5393961992856359 }, { "name": "model.layers.25.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.171649147290736e-05, "sensitivity": 1.1526188464160165 }, { "name": "model.layers.25.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.514349249504448e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9292731748428196e-05, "sensitivity": 0.6069086859657767 }, { "name": "model.layers.25.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.932112253503874e-05, "sensitivity": 0.959065415223597 }, { "name": "model.layers.25.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.540376489283517e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006403631996363401, "sensitivity": 0.5259463446766097 }, { "name": "model.layers.25.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.261478119995445e-05, "sensitivity": 0.8403145748414178 }, { "name": "model.layers.25.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.913360266480595e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006817596731707454, "sensitivity": 0.5908329276900521 }, { "name": "model.layers.25.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.676748332916759e-05, "sensitivity": 0.9488072045020128 }, { "name": "model.layers.25.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.761993063264526e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006417943513952196, "sensitivity": 0.5200728360029869 }, { "name": "model.layers.25.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0705664509441704e-05, "sensitivity": 0.6144474133901939 }, { "name": "model.layers.25.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.655217248408007e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006721611134707928, "sensitivity": 0.5382416665000487 }, { "name": "model.layers.25.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.098694610845996e-05, "sensitivity": 1.4342837308105125 }, { "name": "model.layers.25.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.928292913878977e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006688893772661686, "sensitivity": 0.5327018465554424 }, { "name": "model.layers.25.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.179852789500728e-05, "sensitivity": 1.1160128133976237 }, { "name": "model.layers.25.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.74848649850901e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006896787672303617, "sensitivity": 0.5516972513901114 }, { "name": "model.layers.25.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.28921092255041e-05, "sensitivity": 1.8813081953607635 }, { "name": "model.layers.25.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.406561503055855e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.135453051887453e-05, "sensitivity": 0.9816958375619692 }, { "name": "model.layers.25.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4605019461887423e-06, "sensitivity": 2.0974626367758162 }, { "name": "model.layers.25.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0514595487620682e-06, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.762394721386954e-05, "sensitivity": 0.842897219038038 }, { "name": "model.layers.25.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1097482456534635e-05, "sensitivity": 1.7321853496400759 }, { "name": "model.layers.25.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.638290071554366e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006353583885356784, "sensitivity": 0.5441144175113565 }, { "name": "model.layers.25.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8275862102163956e-05, "sensitivity": 0.6985646976494273 }, { "name": "model.layers.25.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.333352189358266e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.801986117148772e-05, "sensitivity": 0.6767515188787182 }, { "name": "model.layers.25.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.822164530400187e-05, "sensitivity": 1.0966781033818414 }, { "name": "model.layers.25.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.608567441115156e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006657672929577529, "sensitivity": 0.511201281172172 }, { "name": "model.layers.25.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.917781891184859e-05, "sensitivity": 0.8401066248136622 }, { "name": "model.layers.25.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.080526873120107e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8453366364119574e-05, "sensitivity": 0.7581092417365517 }, { "name": "model.layers.25.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0660903171810787e-05, "sensitivity": 1.4999863172859003 }, { "name": "model.layers.25.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.54994220592198e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6482396757928655e-05, "sensitivity": 0.8035750886427779 }, { "name": "model.layers.25.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.283951370278373e-05, "sensitivity": 1.0384848794160542 }, { "name": "model.layers.25.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.231818699438008e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007021225756034255, "sensitivity": 0.5951085137538634 }, { "name": "model.layers.25.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.861831207061186e-05, "sensitivity": 0.8012852605586506 }, { "name": "model.layers.25.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.692386472830549e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007526848348788917, "sensitivity": 0.5968363994876065 }, { "name": "model.layers.25.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 4.615264060703339e-06, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3618731574970298e-06, "sensitivity": 2.101032065467826 }, { "name": "model.layers.25.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.75916009338107e-07, "sensitivity": 10.0 }, { "name": "model.layers.25.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 8.72218151926063e-06, "sensitivity": 1.5931799251240129 }, { "name": "model.layers.25.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 3.307317820144817e-05, "sensitivity": 1.942572236694549 }, { "name": "model.layers.25.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00019686020095832646, "sensitivity": 0.9417370857786393 }, { "name": "model.layers.25.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.448577950213803e-05, "sensitivity": 1.4305350851324847 }, { "name": "model.layers.25.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0006520400638692081, "sensitivity": 0.5561367319595021 }, { "name": "model.layers.25.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003004151221830398, "sensitivity": 0.7192584828288666 }, { "name": "model.layers.26.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007007308304309845, "sensitivity": 0.5773103954841726 }, { "name": "model.layers.26.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.922249440322048e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006826593307778239, "sensitivity": 0.51516205027222 }, { "name": "model.layers.26.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.494693661807105e-05, "sensitivity": 0.9957751843989924 }, { "name": "model.layers.26.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.049514121921675e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007489453419111669, "sensitivity": 0.5343168857398419 }, { "name": "model.layers.26.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.997002881485969e-05, "sensitivity": 1.0888956555863443 }, { "name": "model.layers.26.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.736587122053606e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006723866099491715, "sensitivity": 0.5520143362242681 }, { "name": "model.layers.26.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0447851309436373e-05, "sensitivity": 1.8484316306338198 }, { "name": "model.layers.26.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.119775773389847e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.4180236475076526e-05, "sensitivity": 0.6009714906706488 }, { "name": "model.layers.26.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.743294605053961e-05, "sensitivity": 0.6661311707551536 }, { "name": "model.layers.26.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.041889489300956e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006308346055448055, "sensitivity": 0.5415496082601963 }, { "name": "model.layers.26.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.109551759436727e-05, "sensitivity": 1.0661647975559223 }, { "name": "model.layers.26.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.836232273599308e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006897434359416366, "sensitivity": 0.5652756159574523 }, { "name": "model.layers.26.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.730098200729117e-05, "sensitivity": 1.1180043391177226 }, { "name": "model.layers.26.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.490895430033561e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006433876696974039, "sensitivity": 0.5387871228685892 }, { "name": "model.layers.26.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8324811107013375e-05, "sensitivity": 1.146074155343634 }, { "name": "model.layers.26.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.613256005039148e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006714092451147735, "sensitivity": 0.5076094455556991 }, { "name": "model.layers.26.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.840799323981628e-05, "sensitivity": 0.8394437202469865 }, { "name": "model.layers.26.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.822217753528093e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007896681781858206, "sensitivity": 0.5925955523212638 }, { "name": "model.layers.26.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.946693636360578e-05, "sensitivity": 0.7061378660002118 }, { "name": "model.layers.26.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.725131349114235e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006610815762542188, "sensitivity": 0.5311022320588861 }, { "name": "model.layers.26.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5147247621789575e-05, "sensitivity": 0.8455867481507442 }, { "name": "model.layers.26.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.446809379667684e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006240512011572719, "sensitivity": 0.5333685417381823 }, { "name": "model.layers.26.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.122437869431451e-05, "sensitivity": 0.9504782268020985 }, { "name": "model.layers.26.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.343528073353809e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005791670409962535, "sensitivity": 0.5396502073222493 }, { "name": "model.layers.26.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1802845619968139e-05, "sensitivity": 1.6313755662173586 }, { "name": "model.layers.26.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0847852536244318e-06, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006850893842056394, "sensitivity": 0.5696056730264061 }, { "name": "model.layers.26.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.025598612613976e-05, "sensitivity": 1.5175121089145367 }, { "name": "model.layers.26.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.183715524661238e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006164765218272805, "sensitivity": 0.5271726884645341 }, { "name": "model.layers.26.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.927102392888628e-05, "sensitivity": 0.749770497812392 }, { "name": "model.layers.26.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.381018238243996e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006613103905692697, "sensitivity": 0.5381260922371971 }, { "name": "model.layers.26.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.374707299983129e-05, "sensitivity": 0.6203640327993435 }, { "name": "model.layers.26.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.861178007966373e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007295961841009557, "sensitivity": 0.5474890893073727 }, { "name": "model.layers.26.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.026610243570758e-05, "sensitivity": 1.2536853950603322 }, { "name": "model.layers.26.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.4169280373535e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6732089433353394e-05, "sensitivity": 0.6953680475033642 }, { "name": "model.layers.26.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.403741281246766e-05, "sensitivity": 0.6257804485384524 }, { "name": "model.layers.26.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.017271054290177e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007121781818568707, "sensitivity": 0.540907720495388 }, { "name": "model.layers.26.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8892845117952675e-05, "sensitivity": 0.9934968204255141 }, { "name": "model.layers.26.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.719297971358174e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006369092734530568, "sensitivity": 0.5641537739688777 }, { "name": "model.layers.26.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.821870217914693e-05, "sensitivity": 0.9481442407714711 }, { "name": "model.layers.26.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.440008857884095e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006593175930902362, "sensitivity": 0.5189045181066165 }, { "name": "model.layers.26.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4539758669561706e-06, "sensitivity": 2.097500271719418 }, { "name": "model.layers.26.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3739788755628979e-06, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.4762145737186074e-05, "sensitivity": 0.8009288227365433 }, { "name": "model.layers.26.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.33706949884072e-05, "sensitivity": 0.8969954246973174 }, { "name": "model.layers.26.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.610607776266988e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000700620177667588, "sensitivity": 0.5363925268029777 }, { "name": "model.layers.26.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7146549806930125e-05, "sensitivity": 0.7615099366982612 }, { "name": "model.layers.26.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.891072530379461e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006356819067150354, "sensitivity": 0.5403539982920995 }, { "name": "model.layers.26.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.854754610685632e-05, "sensitivity": 0.7480215177072145 }, { "name": "model.layers.26.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.194596148314304e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007931017316877842, "sensitivity": 0.5716835376979057 }, { "name": "model.layers.26.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.870885433978401e-05, "sensitivity": 1.070076537501205 }, { "name": "model.layers.26.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.255351874846383e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006672201561741531, "sensitivity": 0.5288018868547831 }, { "name": "model.layers.26.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4532437237212434e-06, "sensitivity": 2.0971968422820995 }, { "name": "model.layers.26.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.514305823657196e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006610476411879063, "sensitivity": 0.5737053930284097 }, { "name": "model.layers.26.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.852452522958629e-05, "sensitivity": 0.9742023955881975 }, { "name": "model.layers.26.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.490027087442286e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7144672609865665e-05, "sensitivity": 0.6384735295058241 }, { "name": "model.layers.26.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.429819040931761e-05, "sensitivity": 1.123827473644933 }, { "name": "model.layers.26.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.083004215426627e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007192158373072743, "sensitivity": 0.5917919361627515 }, { "name": "model.layers.26.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0525759181473404e-05, "sensitivity": 0.8901392433179144 }, { "name": "model.layers.26.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0460003068146762e-06, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006799520342610776, "sensitivity": 0.5474172387340495 }, { "name": "model.layers.26.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.252655293792486e-05, "sensitivity": 0.9646515316474938 }, { "name": "model.layers.26.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.459434527845588e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006882669404149055, "sensitivity": 0.5330408502299124 }, { "name": "model.layers.26.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.410731293726712e-05, "sensitivity": 0.8818156597715803 }, { "name": "model.layers.26.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.920179309119703e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007077368791215122, "sensitivity": 0.557013759676577 }, { "name": "model.layers.26.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.293944898061454e-05, "sensitivity": 0.6160327572461622 }, { "name": "model.layers.26.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.997184863801522e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007040548953227699, "sensitivity": 0.5274621985797522 }, { "name": "model.layers.26.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1285452274023555e-05, "sensitivity": 1.636799496861495 }, { "name": "model.layers.26.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.504160859956755e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006848671473562717, "sensitivity": 0.5137228982716278 }, { "name": "model.layers.26.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.987211625324562e-05, "sensitivity": 0.7503984092907282 }, { "name": "model.layers.26.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.147266387619311e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006635044701397419, "sensitivity": 0.5223547291368078 }, { "name": "model.layers.26.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8292811445426196e-05, "sensitivity": 0.8535857909594626 }, { "name": "model.layers.26.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.172399586532265e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006488862563855946, "sensitivity": 0.5187574136491341 }, { "name": "model.layers.26.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7008037401828915e-05, "sensitivity": 0.6607011377730527 }, { "name": "model.layers.26.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.081651804379362e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000639228499494493, "sensitivity": 0.5281131245318267 }, { "name": "model.layers.26.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1334846021782141e-05, "sensitivity": 1.3476312737522704 }, { "name": "model.layers.26.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.904280548449606e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006778526003472507, "sensitivity": 0.5974220955672687 }, { "name": "model.layers.26.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1016533790098038e-05, "sensitivity": 1.7832982831628232 }, { "name": "model.layers.26.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.431939247406262e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006674609030596912, "sensitivity": 0.5767625735124704 }, { "name": "model.layers.26.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0342572750232648e-05, "sensitivity": 1.3413954059640778 }, { "name": "model.layers.26.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.276616997842211e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006198016926646233, "sensitivity": 0.5464895541119174 }, { "name": "model.layers.26.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1058862583013251e-05, "sensitivity": 1.5794480077576944 }, { "name": "model.layers.26.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2308348686929094e-06, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.717131352867e-05, "sensitivity": 0.6055437927672602 }, { "name": "model.layers.26.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.968813249841332e-05, "sensitivity": 0.7826825503936196 }, { "name": "model.layers.26.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3527358078135876e-06, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000779744703322649, "sensitivity": 0.5591465040025525 }, { "name": "model.layers.26.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.925360164837912e-05, "sensitivity": 1.1250238466498101 }, { "name": "model.layers.26.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4186114185577026e-06, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6992063036886975e-05, "sensitivity": 0.7780466636854336 }, { "name": "model.layers.26.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.502835847437382e-05, "sensitivity": 0.886137305129233 }, { "name": "model.layers.26.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.888290045026224e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006199441268108785, "sensitivity": 0.5696660474839033 }, { "name": "model.layers.26.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.983981100143865e-05, "sensitivity": 1.068725652929743 }, { "name": "model.layers.26.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.31129318864987e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8047597121912986e-05, "sensitivity": 0.8691835449653275 }, { "name": "model.layers.26.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.04926681262441e-05, "sensitivity": 0.6656224731767797 }, { "name": "model.layers.26.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.634088206032175e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00066728750243783, "sensitivity": 0.5164341496143652 }, { "name": "model.layers.26.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.108822708483785e-05, "sensitivity": 0.8994951328998599 }, { "name": "model.layers.26.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.867962151271058e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.008036871207878e-05, "sensitivity": 0.6381249711729056 }, { "name": "model.layers.26.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.068296715966426e-05, "sensitivity": 0.8309177849770765 }, { "name": "model.layers.26.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.9453169493936e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.944628719589673e-05, "sensitivity": 0.6241201601428317 }, { "name": "model.layers.26.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8695026382338256e-05, "sensitivity": 0.6162294712324463 }, { "name": "model.layers.26.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.835137007030426e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006616695318371058, "sensitivity": 0.5354274121599369 }, { "name": "model.layers.26.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.971203790977597e-05, "sensitivity": 0.739914914323999 }, { "name": "model.layers.26.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.643673486905755e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006641644868068397, "sensitivity": 0.5275381009133806 }, { "name": "model.layers.26.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.648268036864465e-06, "sensitivity": 2.0211862783162826 }, { "name": "model.layers.26.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.986463282984914e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.508063233923167e-05, "sensitivity": 0.6385563386622441 }, { "name": "model.layers.26.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0568035577307455e-05, "sensitivity": 1.8983488337788532 }, { "name": "model.layers.26.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.68668473433354e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006395919481292367, "sensitivity": 0.5406928877771322 }, { "name": "model.layers.26.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.876376962987706e-05, "sensitivity": 0.7891032467426481 }, { "name": "model.layers.26.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.524720674860873e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006512111867778003, "sensitivity": 0.5243822804852416 }, { "name": "model.layers.26.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.204770033946261e-05, "sensitivity": 0.8407429944419533 }, { "name": "model.layers.26.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.743633432255592e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006865378236398101, "sensitivity": 0.5575558262629976 }, { "name": "model.layers.26.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006220788927748799, "sensitivity": 0.5981480719612228 }, { "name": "model.layers.26.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.280528168645105e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006269393488764763, "sensitivity": 0.5098885095615602 }, { "name": "model.layers.26.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.139402103144675e-05, "sensitivity": 0.7215968811919413 }, { "name": "model.layers.26.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.4223197543688e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007016627350822091, "sensitivity": 0.5309104917845455 }, { "name": "model.layers.26.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0670994015526958e-05, "sensitivity": 1.2511312019689906 }, { "name": "model.layers.26.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.746031880946248e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006563750794157386, "sensitivity": 0.5476073091812773 }, { "name": "model.layers.26.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2894523024442606e-05, "sensitivity": 1.4521395447324248 }, { "name": "model.layers.26.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.734033940527297e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008174054673872888, "sensitivity": 0.5807115751074979 }, { "name": "model.layers.26.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.901339682168327e-05, "sensitivity": 0.7594414767316222 }, { "name": "model.layers.26.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.220046427391935e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006497324211522937, "sensitivity": 0.5170585439744774 }, { "name": "model.layers.26.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.162439240142703e-05, "sensitivity": 0.8055247983949736 }, { "name": "model.layers.26.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.442383088753559e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.139279139460996e-05, "sensitivity": 0.7063777500625144 }, { "name": "model.layers.26.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.078993227565661e-05, "sensitivity": 1.720789838217995 }, { "name": "model.layers.26.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.555510481121019e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006535305874422193, "sensitivity": 0.524243304308953 }, { "name": "model.layers.26.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.356679659802467e-05, "sensitivity": 0.907474136830013 }, { "name": "model.layers.26.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.796619231863588e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007264696760103106, "sensitivity": 0.57222064381686 }, { "name": "model.layers.26.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9224970755167305e-05, "sensitivity": 0.6919700696071359 }, { "name": "model.layers.26.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.444435823344975e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006548903184011579, "sensitivity": 0.5442624245362361 }, { "name": "model.layers.26.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.057304563000798e-05, "sensitivity": 0.9894751062733376 }, { "name": "model.layers.26.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.12793394086475e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006722828256897628, "sensitivity": 0.5310960260202929 }, { "name": "model.layers.26.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.050320735084824e-05, "sensitivity": 0.755330495189909 }, { "name": "model.layers.26.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0134120884686126e-06, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006652991287410259, "sensitivity": 0.5190852017284493 }, { "name": "model.layers.26.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 3.9943415686138906e-06, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.520831458241446e-06, "sensitivity": 2.101308569190747 }, { "name": "model.layers.26.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.758581770962337e-07, "sensitivity": 10.0 }, { "name": "model.layers.26.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 8.589102435507812e-06, "sensitivity": 1.5537654504761338 }, { "name": "model.layers.26.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 3.87376821890939e-05, "sensitivity": 1.8683685828649303 }, { "name": "model.layers.26.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00017956329975277185, "sensitivity": 0.995086997359052 }, { "name": "model.layers.26.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.7036092685884796e-05, "sensitivity": 0.814660240193715 }, { "name": "model.layers.26.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0006765212747268379, "sensitivity": 0.5175334307332194 }, { "name": "model.layers.26.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00025791715597733855, "sensitivity": 0.6915713636909062 }, { "name": "model.layers.27.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.384942389559001e-05, "sensitivity": 0.6470266695895885 }, { "name": "model.layers.27.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.740476917206252e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007095946930348873, "sensitivity": 0.555704632122844 }, { "name": "model.layers.27.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.642623727908358e-05, "sensitivity": 0.6827860188874171 }, { "name": "model.layers.27.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.292598525054927e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006332519114948809, "sensitivity": 0.5325993427234137 }, { "name": "model.layers.27.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.868554191896692e-05, "sensitivity": 0.7302426792072144 }, { "name": "model.layers.27.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2064905376973911e-06, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008054152131080627, "sensitivity": 0.5650284706422344 }, { "name": "model.layers.27.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.476628186646849e-05, "sensitivity": 0.7947266626709241 }, { "name": "model.layers.27.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.502703738282435e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.343161658151075e-05, "sensitivity": 0.6212420711593487 }, { "name": "model.layers.27.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6375192798441276e-05, "sensitivity": 0.7518604015650971 }, { "name": "model.layers.27.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.761165647934831e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006241984665393829, "sensitivity": 0.5298102759211607 }, { "name": "model.layers.27.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.822989623993635e-05, "sensitivity": 0.7010153279226249 }, { "name": "model.layers.27.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.667352749900601e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.020569708198309e-05, "sensitivity": 0.6057938044302839 }, { "name": "model.layers.27.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.363321982556954e-06, "sensitivity": 2.0970905973744047 }, { "name": "model.layers.27.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.999322863521229e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.79564475629013e-05, "sensitivity": 0.6959552300138085 }, { "name": "model.layers.27.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.124279752839357e-05, "sensitivity": 0.6087507597349605 }, { "name": "model.layers.27.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.902975767137832e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00068462616764009, "sensitivity": 0.5534448675267053 }, { "name": "model.layers.27.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2058184438501485e-05, "sensitivity": 1.3461696849105407 }, { "name": "model.layers.27.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0831686267920304e-06, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007221346022561193, "sensitivity": 0.5922445621209058 }, { "name": "model.layers.27.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.360869156196713e-05, "sensitivity": 0.8446105697236841 }, { "name": "model.layers.27.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.690287364108372e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007095012697391212, "sensitivity": 0.5314148658292116 }, { "name": "model.layers.27.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.289671728154644e-05, "sensitivity": 0.8603391390507547 }, { "name": "model.layers.27.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.103948173105891e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007050613639876246, "sensitivity": 0.5248433410884411 }, { "name": "model.layers.27.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007164645940065384, "sensitivity": 0.5923436166488477 }, { "name": "model.layers.27.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.874838049952814e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007372416439466178, "sensitivity": 0.581478708241838 }, { "name": "model.layers.27.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.849138688063249e-05, "sensitivity": 1.0659964264066075 }, { "name": "model.layers.27.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.753326028454467e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006446281331591308, "sensitivity": 0.5568772932167468 }, { "name": "model.layers.27.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9006350056733936e-05, "sensitivity": 0.6435032259897163 }, { "name": "model.layers.27.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.293564294741373e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006757780793122947, "sensitivity": 0.5139642741819704 }, { "name": "model.layers.27.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9676196542568505e-05, "sensitivity": 0.6621761778009396 }, { "name": "model.layers.27.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.07595518179005e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006712016183882952, "sensitivity": 0.5404049112478777 }, { "name": "model.layers.27.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006572530837729573, "sensitivity": 0.5663303489281847 }, { "name": "model.layers.27.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.00596308686363e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000651884765829891, "sensitivity": 0.522777622674848 }, { "name": "model.layers.27.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.077232344774529e-05, "sensitivity": 0.7372235884399145 }, { "name": "model.layers.27.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.66835865356552e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005989265046082437, "sensitivity": 0.520937873586018 }, { "name": "model.layers.27.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006516270223073661, "sensitivity": 0.5722470722076106 }, { "name": "model.layers.27.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.78013145463774e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006652704323641956, "sensitivity": 0.5277171724902437 }, { "name": "model.layers.27.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.292153557296842e-05, "sensitivity": 0.9125960401817063 }, { "name": "model.layers.27.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.208967645055964e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007129345322027802, "sensitivity": 0.5119475417974205 }, { "name": "model.layers.27.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.972729923087172e-05, "sensitivity": 1.048058890054307 }, { "name": "model.layers.27.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.318757747678319e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006691188318654895, "sensitivity": 0.5943031627275932 }, { "name": "model.layers.27.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.422310252673924e-05, "sensitivity": 0.6284361869446151 }, { "name": "model.layers.27.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.122141028048645e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007417702581733465, "sensitivity": 0.5461424543763086 }, { "name": "model.layers.27.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1253799129917752e-05, "sensitivity": 1.4070632954399063 }, { "name": "model.layers.27.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.031011364233564e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006810346385464072, "sensitivity": 0.5853975783394711 }, { "name": "model.layers.27.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8795223594643176e-05, "sensitivity": 0.9736073550263282 }, { "name": "model.layers.27.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.538066372741014e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00066421739757061, "sensitivity": 0.5420263302412424 }, { "name": "model.layers.27.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.805718683404848e-05, "sensitivity": 0.7099313250576189 }, { "name": "model.layers.27.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.717152357145096e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006543698254972696, "sensitivity": 0.5375193295575428 }, { "name": "model.layers.27.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.125729123596102e-05, "sensitivity": 0.7403609161363012 }, { "name": "model.layers.27.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.595724014208827e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006544270436279476, "sensitivity": 0.5501699940643386 }, { "name": "model.layers.27.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1006060958607122e-05, "sensitivity": 1.392130303156212 }, { "name": "model.layers.27.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1664914154607686e-06, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.830282316310331e-05, "sensitivity": 0.7122747572809305 }, { "name": "model.layers.27.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1211372111574747e-05, "sensitivity": 1.2197691108910969 }, { "name": "model.layers.27.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.458983191099833e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8286357671022415e-05, "sensitivity": 0.9451437107221338 }, { "name": "model.layers.27.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.614034646190703e-05, "sensitivity": 0.8422466985806579 }, { "name": "model.layers.27.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.95206278275873e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007361894240602851, "sensitivity": 0.5264628707160204 }, { "name": "model.layers.27.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.172547000460327e-05, "sensitivity": 0.9257807293254767 }, { "name": "model.layers.27.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3320975540409563e-06, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006792682106606662, "sensitivity": 0.553119752144999 }, { "name": "model.layers.27.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.479403519828338e-06, "sensitivity": 2.0970519270363943 }, { "name": "model.layers.27.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.064128221325518e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006763099227100611, "sensitivity": 0.5496228028495056 }, { "name": "model.layers.27.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7816207117866725e-05, "sensitivity": 0.6337871055569014 }, { "name": "model.layers.27.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.781809472362511e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006503866752609611, "sensitivity": 0.5549517762863696 }, { "name": "model.layers.27.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.027934068697505e-05, "sensitivity": 0.6129501885254899 }, { "name": "model.layers.27.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.778946269354492e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006879507564008236, "sensitivity": 0.5356812815037768 }, { "name": "model.layers.27.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.029051655787043e-05, "sensitivity": 1.0706407750024676 }, { "name": "model.layers.27.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.065275096669211e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006839300040155649, "sensitivity": 0.5339190356078701 }, { "name": "model.layers.27.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0295453295111656e-05, "sensitivity": 0.7335443146568597 }, { "name": "model.layers.27.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.443141723546432e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006816661916673183, "sensitivity": 0.5460800670814949 }, { "name": "model.layers.27.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.834179319208488e-05, "sensitivity": 0.7740231505244342 }, { "name": "model.layers.27.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.265693173190812e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006590489065274596, "sensitivity": 0.5030929982149938 }, { "name": "model.layers.27.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7815268519334495e-05, "sensitivity": 0.6567396142634357 }, { "name": "model.layers.27.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.534965220656886e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006578967440873384, "sensitivity": 0.5153308246690461 }, { "name": "model.layers.27.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.564966704696417e-05, "sensitivity": 0.9931195557988537 }, { "name": "model.layers.27.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.150376066216268e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006399505655281246, "sensitivity": 0.5517405155931466 }, { "name": "model.layers.27.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.842160317115486e-05, "sensitivity": 0.9321401237216101 }, { "name": "model.layers.27.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.363786155816342e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006506257341243327, "sensitivity": 0.5455580876355213 }, { "name": "model.layers.27.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1292246199445799e-05, "sensitivity": 1.2701585965846582 }, { "name": "model.layers.27.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1427478057157714e-06, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.153671711217612e-05, "sensitivity": 0.7317459702728198 }, { "name": "model.layers.27.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007406770600937307, "sensitivity": 0.5747099633201722 }, { "name": "model.layers.27.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.573866464052116e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007522301748394966, "sensitivity": 0.5810859913742512 }, { "name": "model.layers.27.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.199054066906683e-05, "sensitivity": 0.741022700835067 }, { "name": "model.layers.27.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.742003850173205e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006125321378931403, "sensitivity": 0.530466668122792 }, { "name": "model.layers.27.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1502159395604394e-05, "sensitivity": 1.4735509324971787 }, { "name": "model.layers.27.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.815812861939776e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006827967590652406, "sensitivity": 0.5333204508135629 }, { "name": "model.layers.27.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.926302037551068e-05, "sensitivity": 0.8900549183220812 }, { "name": "model.layers.27.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.560261110484134e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.820286605739966e-05, "sensitivity": 0.6871348149170888 }, { "name": "model.layers.27.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.991708530928008e-05, "sensitivity": 0.9436072957356295 }, { "name": "model.layers.27.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.703047231188975e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.012379890307784e-05, "sensitivity": 0.6313819475175239 }, { "name": "model.layers.27.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.1011320212855935e-05, "sensitivity": 0.7764919973371954 }, { "name": "model.layers.27.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.579635277783382e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0016154748154804e-05, "sensitivity": 0.6715777666901775 }, { "name": "model.layers.27.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.094970376580022e-05, "sensitivity": 0.8549986386836548 }, { "name": "model.layers.27.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6447260122731677e-06, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.047650094842538e-05, "sensitivity": 0.786721266890773 }, { "name": "model.layers.27.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.011294317431748e-05, "sensitivity": 0.8003000557510581 }, { "name": "model.layers.27.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.069556318128889e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007085083052515984, "sensitivity": 0.5338846265200456 }, { "name": "model.layers.27.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1410392289690208e-05, "sensitivity": 1.600367343713598 }, { "name": "model.layers.27.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.051226020848844e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006981290644034743, "sensitivity": 0.5155833364470346 }, { "name": "model.layers.27.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.951302591711283e-05, "sensitivity": 0.612576356416924 }, { "name": "model.layers.27.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.908679779371596e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006668507121503353, "sensitivity": 0.5275179552618658 }, { "name": "model.layers.27.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0211018889094703e-05, "sensitivity": 1.44018179834609 }, { "name": "model.layers.27.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.249236091411149e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.694985156878829e-05, "sensitivity": 0.642853422475003 }, { "name": "model.layers.27.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.523270712932572e-05, "sensitivity": 0.7531900645993648 }, { "name": "model.layers.27.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.607888387108687e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.543614290421829e-05, "sensitivity": 0.6161770366373405 }, { "name": "model.layers.27.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.482606113422662e-05, "sensitivity": 1.133363156556828 }, { "name": "model.layers.27.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.308419753826456e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000725594989489764, "sensitivity": 0.5692650309442827 }, { "name": "model.layers.27.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.150025728857145e-05, "sensitivity": 0.7206207370411886 }, { "name": "model.layers.27.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.390909099238343e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000687071995344013, "sensitivity": 0.53869119430384 }, { "name": "model.layers.27.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.989425699226558e-05, "sensitivity": 0.828870731865391 }, { "name": "model.layers.27.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.405242510889366e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006657940102741122, "sensitivity": 0.5425151787579583 }, { "name": "model.layers.27.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3830532427382423e-06, "sensitivity": 2.0972365605468912 }, { "name": "model.layers.27.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.025142296384729e-06, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.816239718114957e-05, "sensitivity": 0.6091171092510885 }, { "name": "model.layers.27.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3869087423663586e-05, "sensitivity": 0.9522800234540035 }, { "name": "model.layers.27.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.263416819114354e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006393005605787039, "sensitivity": 0.5610410816766879 }, { "name": "model.layers.27.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1341496247041505e-05, "sensitivity": 1.2471781758916425 }, { "name": "model.layers.27.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.2218118652454e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007247984176501632, "sensitivity": 0.5739509925005964 }, { "name": "model.layers.27.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.158048538258299e-05, "sensitivity": 0.8144017278924174 }, { "name": "model.layers.27.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0386789881522418e-06, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.363596523646265e-05, "sensitivity": 0.7057946130204937 }, { "name": "model.layers.27.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.73617614666e-05, "sensitivity": 1.0613630927748505 }, { "name": "model.layers.27.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.298902685055509e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.564041541423649e-05, "sensitivity": 0.8029282396972294 }, { "name": "model.layers.27.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8756821090355515e-05, "sensitivity": 1.1139750563150939 }, { "name": "model.layers.27.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.802135198493488e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006499493028968573, "sensitivity": 0.5418985066462261 }, { "name": "model.layers.27.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.183009827509522e-05, "sensitivity": 0.9981074927665802 }, { "name": "model.layers.27.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.087689250009134e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006809207843616605, "sensitivity": 0.5443896307182087 }, { "name": "model.layers.27.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.755706661147997e-05, "sensitivity": 0.8474863751121067 }, { "name": "model.layers.27.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.378040436378797e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006510355742648244, "sensitivity": 0.5611174568528803 }, { "name": "model.layers.27.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.914029316045344e-05, "sensitivity": 1.087191160402956 }, { "name": "model.layers.27.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.884197543717164e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006543115014210343, "sensitivity": 0.585416721839086 }, { "name": "model.layers.27.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006081392057240009, "sensitivity": 0.5850200563401838 }, { "name": "model.layers.27.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.162151748867473e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006300742388702929, "sensitivity": 0.5357786867747565 }, { "name": "model.layers.27.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 4.374996024125721e-06, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3550717287434964e-06, "sensitivity": 2.1006861060842814 }, { "name": "model.layers.27.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.937963684729766e-07, "sensitivity": 10.0 }, { "name": "model.layers.27.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.9620028979261406e-06, "sensitivity": 2.1039647012340463 }, { "name": "model.layers.27.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 3.422369991312735e-05, "sensitivity": 1.9512029449160893 }, { "name": "model.layers.27.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.0001760940212989226, "sensitivity": 0.8561525697563467 }, { "name": "model.layers.27.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.4316299711936153e-05, "sensitivity": 1.2497829376172984 }, { "name": "model.layers.27.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 4, "mse": 1.2362863344606012e-05, "sensitivity": 1.7385024860529614 }, { "name": "model.layers.27.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00024785325513221323, "sensitivity": 0.7570314386150334 }, { "name": "model.layers.28.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1517098755575716e-05, "sensitivity": 1.3845221120481037 }, { "name": "model.layers.28.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.235366426044493e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.300222594290972e-05, "sensitivity": 0.6171037872326194 }, { "name": "model.layers.28.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.915984365856275e-05, "sensitivity": 0.8207255057656406 }, { "name": "model.layers.28.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.474081146734534e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006657486082985997, "sensitivity": 0.5373346265949668 }, { "name": "model.layers.28.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9264675655867904e-05, "sensitivity": 0.7928243784429634 }, { "name": "model.layers.28.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.283659897439065e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006783275748603046, "sensitivity": 0.5343504565474738 }, { "name": "model.layers.28.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.089310045354068e-05, "sensitivity": 1.0112043354082088 }, { "name": "model.layers.28.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.95663857186446e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006749384920112789, "sensitivity": 0.5272141302122307 }, { "name": "model.layers.28.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8853504015132785e-05, "sensitivity": 0.767797311580168 }, { "name": "model.layers.28.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.745196626274264e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006428570486605167, "sensitivity": 0.5538698233223288 }, { "name": "model.layers.28.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.175230762688443e-05, "sensitivity": 0.6386149898445586 }, { "name": "model.layers.28.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.729024223910528e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006064579356461763, "sensitivity": 0.5448054630031786 }, { "name": "model.layers.28.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1074560461565852e-05, "sensitivity": 1.300341113594244 }, { "name": "model.layers.28.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2048066082570585e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006850849604234099, "sensitivity": 0.5792856311135804 }, { "name": "model.layers.28.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8372268540551886e-05, "sensitivity": 0.7087038090522175 }, { "name": "model.layers.28.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0485204029464512e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.873500049347058e-05, "sensitivity": 0.6929383021879858 }, { "name": "model.layers.28.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.217576446942985e-05, "sensitivity": 1.1498924725897361 }, { "name": "model.layers.28.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.902825356926769e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000722693745046854, "sensitivity": 0.5462541055587917 }, { "name": "model.layers.28.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.574763392563909e-05, "sensitivity": 0.8975571626114702 }, { "name": "model.layers.28.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0201738405157812e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.632195436395705e-05, "sensitivity": 0.6589211946951546 }, { "name": "model.layers.28.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.866717401659116e-05, "sensitivity": 0.6960977528777147 }, { "name": "model.layers.28.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.636686293859384e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006761203403584659, "sensitivity": 0.5262781665243321 }, { "name": "model.layers.28.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.750277705374174e-05, "sensitivity": 0.640724123122386 }, { "name": "model.layers.28.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.402969686154393e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006664732354693115, "sensitivity": 0.5329493765184738 }, { "name": "model.layers.28.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.147289968794212e-05, "sensitivity": 1.006274836211792 }, { "name": "model.layers.28.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.556869038831792e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.136907904874533e-05, "sensitivity": 0.6648555988683933 }, { "name": "model.layers.28.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.604357284028083e-05, "sensitivity": 1.0267485738301338 }, { "name": "model.layers.28.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.137729767237033e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006815920351073146, "sensitivity": 0.5179328404312741 }, { "name": "model.layers.28.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.983300434309058e-05, "sensitivity": 0.8836541281219474 }, { "name": "model.layers.28.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.475907063460909e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006570428377017379, "sensitivity": 0.5363534402834835 }, { "name": "model.layers.28.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.829826113767922e-05, "sensitivity": 0.8573711019697038 }, { "name": "model.layers.28.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.273864983086241e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006609940901398659, "sensitivity": 0.5274231008003196 }, { "name": "model.layers.28.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1422262105043046e-05, "sensitivity": 1.4560266423040886 }, { "name": "model.layers.28.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.436868708689872e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.065690831746906e-05, "sensitivity": 0.8180627705612841 }, { "name": "model.layers.28.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.061400563339703e-05, "sensitivity": 0.6932434192924551 }, { "name": "model.layers.28.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.611855264462065e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006937377038411796, "sensitivity": 0.5549329403697381 }, { "name": "model.layers.28.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.449253851315007e-05, "sensitivity": 0.7200468426547384 }, { "name": "model.layers.28.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.806049436316243e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007630165200680494, "sensitivity": 0.559927693429743 }, { "name": "model.layers.28.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1119393093395047e-05, "sensitivity": 1.4443114089478908 }, { "name": "model.layers.28.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.294317694890196e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006443373276852071, "sensitivity": 0.5614863768960535 }, { "name": "model.layers.28.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.802817759104073e-05, "sensitivity": 1.077268042673643 }, { "name": "model.layers.28.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.002990870802023e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00064762745751068, "sensitivity": 0.5281678749478926 }, { "name": "model.layers.28.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.890499960514717e-05, "sensitivity": 0.6339506119617764 }, { "name": "model.layers.28.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.085098670562729e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000675192684866488, "sensitivity": 0.5638026440283206 }, { "name": "model.layers.28.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8286794228479266e-05, "sensitivity": 0.6553369552194496 }, { "name": "model.layers.28.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0889137911362923e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006539142923429608, "sensitivity": 0.5440131242679858 }, { "name": "model.layers.28.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.973782390356064e-05, "sensitivity": 0.626382735990033 }, { "name": "model.layers.28.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.798655244390829e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.013415986672044e-05, "sensitivity": 0.6070579257144499 }, { "name": "model.layers.28.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0933740668406244e-05, "sensitivity": 1.3959551445713654 }, { "name": "model.layers.28.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.214106077895849e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8029108913615346e-05, "sensitivity": 0.7369832413226546 }, { "name": "model.layers.28.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006781236152164638, "sensitivity": 0.5291499154152135 }, { "name": "model.layers.28.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.736474347235344e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006878258427605033, "sensitivity": 0.5455611382991278 }, { "name": "model.layers.28.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.85953748668544e-05, "sensitivity": 0.6604650025029976 }, { "name": "model.layers.28.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.37330231256783e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006867152405902743, "sensitivity": 0.5353496565318944 }, { "name": "model.layers.28.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.808087735204026e-05, "sensitivity": 0.6195786288448822 }, { "name": "model.layers.28.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.910101658126223e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006605664966627955, "sensitivity": 0.5175739659711703 }, { "name": "model.layers.28.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.425141327781603e-05, "sensitivity": 0.8945409969839327 }, { "name": "model.layers.28.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.639427389629418e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000746148347388953, "sensitivity": 0.5394101651641264 }, { "name": "model.layers.28.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.623642573482357e-05, "sensitivity": 0.6981493970988233 }, { "name": "model.layers.28.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.729707587917801e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006425504107028246, "sensitivity": 0.5446858908352791 }, { "name": "model.layers.28.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.771667929366231e-05, "sensitivity": 1.043072170092894 }, { "name": "model.layers.28.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6778694771346636e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8086414355784655e-05, "sensitivity": 0.6336775457268262 }, { "name": "model.layers.28.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0286295946571045e-05, "sensitivity": 1.2720708364551605 }, { "name": "model.layers.28.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.124210128495179e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006483166362158954, "sensitivity": 0.5292551574166814 }, { "name": "model.layers.28.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.03829394094646e-05, "sensitivity": 0.6838314290241412 }, { "name": "model.layers.28.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.626148092436779e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006796428933739662, "sensitivity": 0.5377114467459789 }, { "name": "model.layers.28.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.983950803871267e-06, "sensitivity": 1.4171620371018916 }, { "name": "model.layers.28.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.082386789785232e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005957980174571276, "sensitivity": 0.5867069338461128 }, { "name": "model.layers.28.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007051430875435472, "sensitivity": 0.589400012276723 }, { "name": "model.layers.28.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.397487706839456e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.322187255136669e-05, "sensitivity": 0.6702334418199658 }, { "name": "model.layers.28.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.233820749912411e-05, "sensitivity": 0.6778683869009887 }, { "name": "model.layers.28.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.739389502603444e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007077637128531933, "sensitivity": 0.5376812765830634 }, { "name": "model.layers.28.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.845688039902598e-05, "sensitivity": 1.0396736290897197 }, { "name": "model.layers.28.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.030115961650154e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.143474067561328e-05, "sensitivity": 0.6248264622916615 }, { "name": "model.layers.28.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.2241477533243597e-05, "sensitivity": 0.9017219887392713 }, { "name": "model.layers.28.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.143466973502655e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006028743810020387, "sensitivity": 0.5151649229634709 }, { "name": "model.layers.28.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.246287375688553e-05, "sensitivity": 1.0064727279720493 }, { "name": "model.layers.28.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.758940571671701e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007206174777820706, "sensitivity": 0.5163782116134934 }, { "name": "model.layers.28.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.854380287928507e-05, "sensitivity": 0.9828884803775354 }, { "name": "model.layers.28.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0652006494638044e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006579567561857402, "sensitivity": 0.5639534274185943 }, { "name": "model.layers.28.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9275596868246794e-05, "sensitivity": 0.9987528851731046 }, { "name": "model.layers.28.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.778033707632858e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006891472148708999, "sensitivity": 0.5912340531527924 }, { "name": "model.layers.28.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8089877711609006e-05, "sensitivity": 1.0893866229993694 }, { "name": "model.layers.28.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.290603096203995e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.933266947977245e-05, "sensitivity": 0.6131824993769073 }, { "name": "model.layers.28.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.7811854579340434e-06, "sensitivity": 2.0978541064883722 }, { "name": "model.layers.28.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6521771613042802e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.854350067442283e-05, "sensitivity": 0.7121417744227643 }, { "name": "model.layers.28.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0931343240372371e-05, "sensitivity": 1.458821667791365 }, { "name": "model.layers.28.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.31569082038186e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006785143632441759, "sensitivity": 0.5437391006811213 }, { "name": "model.layers.28.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.470739026553929e-05, "sensitivity": 0.9324797120502207 }, { "name": "model.layers.28.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1568572517717257e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007516397163271904, "sensitivity": 0.5587344518079542 }, { "name": "model.layers.28.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.044458132237196e-05, "sensitivity": 1.065522808238687 }, { "name": "model.layers.28.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.495884233321704e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.964516822132282e-05, "sensitivity": 0.6450792591913838 }, { "name": "model.layers.28.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.279005174292251e-05, "sensitivity": 0.6404639296635584 }, { "name": "model.layers.28.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.020678023967776e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007180289831012487, "sensitivity": 0.5240334219414674 }, { "name": "model.layers.28.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.884558049729094e-05, "sensitivity": 0.9194892912211226 }, { "name": "model.layers.28.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3318931451067328e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.72594981349539e-05, "sensitivity": 0.6520209732223019 }, { "name": "model.layers.28.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007133157923817635, "sensitivity": 0.5652289004274336 }, { "name": "model.layers.28.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.978086955517938e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007206270820461214, "sensitivity": 0.5349936654473556 }, { "name": "model.layers.28.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.289721204666421e-05, "sensitivity": 1.0604471067032206 }, { "name": "model.layers.28.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2000239166809479e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.19155471213162e-05, "sensitivity": 0.7886211558309308 }, { "name": "model.layers.28.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006505344063043594, "sensitivity": 0.5559563699226795 }, { "name": "model.layers.28.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.961429335206049e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006614547455683351, "sensitivity": 0.5372441272969999 }, { "name": "model.layers.28.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4428994189947844e-05, "sensitivity": 0.9322809397296452 }, { "name": "model.layers.28.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.276102340052603e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.715392035199329e-05, "sensitivity": 0.6370349331749222 }, { "name": "model.layers.28.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.571246922248974e-05, "sensitivity": 0.7936023131855989 }, { "name": "model.layers.28.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.35572258841421e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007760361768305302, "sensitivity": 0.5994543032267188 }, { "name": "model.layers.28.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.421526657301001e-05, "sensitivity": 0.6068380256072244 }, { "name": "model.layers.28.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.027148629073054e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006373185315169394, "sensitivity": 0.5458608971655083 }, { "name": "model.layers.28.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.127447704784572e-05, "sensitivity": 0.888038785071647 }, { "name": "model.layers.28.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.456365776510211e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000687946449033916, "sensitivity": 0.5528346957227531 }, { "name": "model.layers.28.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.663709816872142e-05, "sensitivity": 0.659516305615286 }, { "name": "model.layers.28.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.517793735838495e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006496310234069824, "sensitivity": 0.5702099881270537 }, { "name": "model.layers.28.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.308791489573196e-05, "sensitivity": 0.7912834917742791 }, { "name": "model.layers.28.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0568131756372168e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007095853798091412, "sensitivity": 0.5506845417297036 }, { "name": "model.layers.28.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.178260082378983e-05, "sensitivity": 0.7220366704862622 }, { "name": "model.layers.28.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.263172048827983e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007009397959336638, "sensitivity": 0.5180845050300533 }, { "name": "model.layers.28.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.927733946009539e-05, "sensitivity": 0.6857538373807325 }, { "name": "model.layers.28.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0973456028295914e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006766663282178342, "sensitivity": 0.5318873486268223 }, { "name": "model.layers.28.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.526322977151722e-05, "sensitivity": 0.9809919719862861 }, { "name": "model.layers.28.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.632684966869419e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.56214397167787e-05, "sensitivity": 0.693782698302144 }, { "name": "model.layers.28.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.157565076136962e-05, "sensitivity": 0.6108976481196985 }, { "name": "model.layers.28.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.39800009089231e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006914960104040802, "sensitivity": 0.5410978766304497 }, { "name": "model.layers.28.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3124076657695696e-05, "sensitivity": 0.7632922041735228 }, { "name": "model.layers.28.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.212451353349024e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006113330600783229, "sensitivity": 0.5443667527144924 }, { "name": "model.layers.28.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.783961387351155e-05, "sensitivity": 0.9927341750697767 }, { "name": "model.layers.28.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.475303729937878e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006453141686506569, "sensitivity": 0.5253810678740389 }, { "name": "model.layers.28.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.567068339791149e-05, "sensitivity": 0.8070947229489885 }, { "name": "model.layers.28.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.325666271957743e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007650158368051052, "sensitivity": 0.548946497516127 }, { "name": "model.layers.28.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 4.076369350514142e-06, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3591956050950103e-06, "sensitivity": 2.1013863793855396 }, { "name": "model.layers.28.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.214302968350239e-07, "sensitivity": 10.0 }, { "name": "model.layers.28.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.926277491293149e-06, "sensitivity": 2.105096517925529 }, { "name": "model.layers.28.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 9.340635187982116e-06, "sensitivity": 2.214850930883572 }, { "name": "model.layers.28.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.0002082700520986691, "sensitivity": 0.8735159737834655 }, { "name": "model.layers.28.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.5722242096671835e-05, "sensitivity": 1.2867135701127401 }, { "name": "model.layers.28.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0006687938002869487, "sensitivity": 0.5640842856143823 }, { "name": "model.layers.28.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003138853353448212, "sensitivity": 1.1068699345194186 }, { "name": "model.layers.29.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2202923244331032e-05, "sensitivity": 1.2428196903957014 }, { "name": "model.layers.29.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.793938622540736e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.709701847285032e-05, "sensitivity": 0.7661643064086392 }, { "name": "model.layers.29.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8579746109899133e-05, "sensitivity": 0.8625076854763248 }, { "name": "model.layers.29.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.088291908985411e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006722623365931213, "sensitivity": 0.5861116375587321 }, { "name": "model.layers.29.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6195727665908635e-05, "sensitivity": 0.7857206036264581 }, { "name": "model.layers.29.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.056473805278074e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006662987871095538, "sensitivity": 0.5242402240112217 }, { "name": "model.layers.29.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.298573134699836e-05, "sensitivity": 0.7941621586085202 }, { "name": "model.layers.29.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.027045848597481e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000718500348739326, "sensitivity": 0.5398256409695666 }, { "name": "model.layers.29.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.997763219056651e-05, "sensitivity": 0.9422023574309845 }, { "name": "model.layers.29.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.827529202586447e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006820994894951582, "sensitivity": 0.5156950746868437 }, { "name": "model.layers.29.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7777429901761934e-05, "sensitivity": 0.8031297770775302 }, { "name": "model.layers.29.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.349869974859757e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006921006715856493, "sensitivity": 0.5894159202616576 }, { "name": "model.layers.29.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006293547339737415, "sensitivity": 0.5767885804903992 }, { "name": "model.layers.29.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.029985908957315e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006501083262264729, "sensitivity": 0.5222201841215119 }, { "name": "model.layers.29.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0422586456115823e-05, "sensitivity": 1.8262739473891656 }, { "name": "model.layers.29.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.732021802235977e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.092646799515933e-05, "sensitivity": 0.6801860364973717 }, { "name": "model.layers.29.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.57519742869772e-05, "sensitivity": 0.9318497535566537 }, { "name": "model.layers.29.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.853702186366718e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006657260237261653, "sensitivity": 0.5008463755297006 }, { "name": "model.layers.29.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0431641385366675e-05, "sensitivity": 1.2564126978783483 }, { "name": "model.layers.29.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.282388535008067e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006376872770488262, "sensitivity": 0.5781821326730185 }, { "name": "model.layers.29.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.232323847943917e-05, "sensitivity": 1.23222239596985 }, { "name": "model.layers.29.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0076587386720348e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007745804032310843, "sensitivity": 0.5231661935098895 }, { "name": "model.layers.29.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1087429811595939e-05, "sensitivity": 1.3052851872857085 }, { "name": "model.layers.29.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.89092950981285e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006961814360693097, "sensitivity": 0.568521998607951 }, { "name": "model.layers.29.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.789749411633238e-05, "sensitivity": 1.1862038067853358 }, { "name": "model.layers.29.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0700545090003288e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006612049182876945, "sensitivity": 0.5740127970590566 }, { "name": "model.layers.29.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1066964361816645e-05, "sensitivity": 1.8996516360439744 }, { "name": "model.layers.29.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.110686854299274e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006680000806227326, "sensitivity": 0.5398895505502513 }, { "name": "model.layers.29.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.989139754092321e-05, "sensitivity": 1.153840678749005 }, { "name": "model.layers.29.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.973207516442926e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006780295516364276, "sensitivity": 0.5714887544583714 }, { "name": "model.layers.29.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006712726317346096, "sensitivity": 0.5677780107920719 }, { "name": "model.layers.29.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.489924200854148e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006913216784596443, "sensitivity": 0.5340704240354985 }, { "name": "model.layers.29.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9222507843514904e-05, "sensitivity": 0.649827532947755 }, { "name": "model.layers.29.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.931711252240348e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000686544575728476, "sensitivity": 0.588246013381343 }, { "name": "model.layers.29.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007178501691669226, "sensitivity": 0.5877178282840966 }, { "name": "model.layers.29.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.079519832586811e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007223798893392086, "sensitivity": 0.5625320938861073 }, { "name": "model.layers.29.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1012469258275814e-05, "sensitivity": 1.4571201852828575 }, { "name": "model.layers.29.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.967941317270743e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.108960951678455e-05, "sensitivity": 0.6055201292619797 }, { "name": "model.layers.29.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.926140147494152e-05, "sensitivity": 1.0577604404584524 }, { "name": "model.layers.29.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.906323844508734e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006800724077038467, "sensitivity": 0.525615337943894 }, { "name": "model.layers.29.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.233587919268757e-05, "sensitivity": 0.9036201411088436 }, { "name": "model.layers.29.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.834031177684665e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006956764264032245, "sensitivity": 0.5367365210087323 }, { "name": "model.layers.29.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.133883289294317e-05, "sensitivity": 1.1063866674393905 }, { "name": "model.layers.29.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.647083061281592e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.078482692828402e-05, "sensitivity": 0.7385075662368118 }, { "name": "model.layers.29.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.430511712096632e-05, "sensitivity": 1.1155245392844504 }, { "name": "model.layers.29.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.49173239000811e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007354483823291957, "sensitivity": 0.5371326534003364 }, { "name": "model.layers.29.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7947789173340425e-05, "sensitivity": 0.6919189512275715 }, { "name": "model.layers.29.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.879747616039822e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000661009456962347, "sensitivity": 0.5075702350296191 }, { "name": "model.layers.29.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006237146444618702, "sensitivity": 0.5660342879166813 }, { "name": "model.layers.29.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.175422413434717e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006687139975838363, "sensitivity": 0.5737755669729333 }, { "name": "model.layers.29.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.566625961568207e-05, "sensitivity": 0.796951613502413 }, { "name": "model.layers.29.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0353799098083982e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007504690438508987, "sensitivity": 0.5375219017448513 }, { "name": "model.layers.29.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9802037867484614e-05, "sensitivity": 0.6798338137765498 }, { "name": "model.layers.29.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.311515790002886e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006779401446692646, "sensitivity": 0.5254973802199494 }, { "name": "model.layers.29.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.283110997173935e-05, "sensitivity": 0.795784823259125 }, { "name": "model.layers.29.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4023775065652444e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007018701871857047, "sensitivity": 0.5457532178411342 }, { "name": "model.layers.29.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6196404329966754e-05, "sensitivity": 1.077523618590845 }, { "name": "model.layers.29.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.569138122358709e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006603479268960655, "sensitivity": 0.5695466827858201 }, { "name": "model.layers.29.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0752041816886049e-05, "sensitivity": 1.438171971506604 }, { "name": "model.layers.29.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.768734798853984e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7757853937800974e-05, "sensitivity": 0.6028970442222918 }, { "name": "model.layers.29.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.138226308394223e-05, "sensitivity": 0.8964289761600084 }, { "name": "model.layers.29.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.901593784888973e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000711970729753375, "sensitivity": 0.5863898417525213 }, { "name": "model.layers.29.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0421465958643239e-05, "sensitivity": 1.3297568669006965 }, { "name": "model.layers.29.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.504629249728168e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006424713646993041, "sensitivity": 0.5797313588826508 }, { "name": "model.layers.29.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.034183024894446e-05, "sensitivity": 0.7551102994747794 }, { "name": "model.layers.29.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.961083383634104e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006856407853774726, "sensitivity": 0.5857623295934988 }, { "name": "model.layers.29.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.09804701525718e-05, "sensitivity": 0.9258250507563723 }, { "name": "model.layers.29.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.989495773268573e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000705176149494946, "sensitivity": 0.5613614368827883 }, { "name": "model.layers.29.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.198450864758343e-05, "sensitivity": 0.6375846212817792 }, { "name": "model.layers.29.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.739246825622104e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007079929928295314, "sensitivity": 0.5326762379515698 }, { "name": "model.layers.29.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.163555498351343e-05, "sensitivity": 1.230595093148923 }, { "name": "model.layers.29.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.94154333966435e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.411809590645134e-05, "sensitivity": 0.805587051807257 }, { "name": "model.layers.29.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1243765584367793e-05, "sensitivity": 1.241634105147677 }, { "name": "model.layers.29.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.475347842955671e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006898852298036218, "sensitivity": 0.5839526989530381 }, { "name": "model.layers.29.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1175480722158682e-05, "sensitivity": 1.3589498417227364 }, { "name": "model.layers.29.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0268778396493872e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.128239328972995e-05, "sensitivity": 1.0226825999244105 }, { "name": "model.layers.29.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.3500389286491554e-05, "sensitivity": 1.2856436479466968 }, { "name": "model.layers.29.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0672217740648193e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.817922596586868e-05, "sensitivity": 0.735424878448092 }, { "name": "model.layers.29.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8055913541466e-05, "sensitivity": 0.6472351196485872 }, { "name": "model.layers.29.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.810197300590517e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006911588134244084, "sensitivity": 0.539744523902177 }, { "name": "model.layers.29.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1501897461130284e-05, "sensitivity": 1.6607179458976082 }, { "name": "model.layers.29.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.891829222397064e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.287913856795058e-05, "sensitivity": 0.7105980994435643 }, { "name": "model.layers.29.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8686156990006566e-05, "sensitivity": 0.6456902895304898 }, { "name": "model.layers.29.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.825528882676736e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006794440560042858, "sensitivity": 0.521410162012892 }, { "name": "model.layers.29.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7550765632186085e-05, "sensitivity": 0.9266006562597509 }, { "name": "model.layers.29.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.680682756472379e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006679994985461235, "sensitivity": 0.5045260072667561 }, { "name": "model.layers.29.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.96625468460843e-05, "sensitivity": 1.127357061817252 }, { "name": "model.layers.29.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.079819278667856e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006761566619388759, "sensitivity": 0.5431194106430701 }, { "name": "model.layers.29.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.376586679834872e-05, "sensitivity": 0.6759466703952788 }, { "name": "model.layers.29.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.266098916465126e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.42963859718293e-05, "sensitivity": 0.6660097341938759 }, { "name": "model.layers.29.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0922470210061874e-05, "sensitivity": 1.7621816466696123 }, { "name": "model.layers.29.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.929210141810472e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00067975337151438, "sensitivity": 0.5844808968714085 }, { "name": "model.layers.29.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.343980930978432e-05, "sensitivity": 1.083174489513817 }, { "name": "model.layers.29.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1778834050346632e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007397168083116412, "sensitivity": 0.5205947016472083 }, { "name": "model.layers.29.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8955163694918156e-05, "sensitivity": 0.9503366381029716 }, { "name": "model.layers.29.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.689407877682243e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006602643406949937, "sensitivity": 0.5558265280590873 }, { "name": "model.layers.29.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.923423304921016e-05, "sensitivity": 0.7318780769070845 }, { "name": "model.layers.29.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.675053896287864e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006760814576409757, "sensitivity": 0.5222850768586121 }, { "name": "model.layers.29.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.198509072419256e-05, "sensitivity": 1.0467227833139205 }, { "name": "model.layers.29.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0941247410301003e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.359622057061642e-05, "sensitivity": 0.6696242068648006 }, { "name": "model.layers.29.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.422137473942712e-05, "sensitivity": 0.9215037161725961 }, { "name": "model.layers.29.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.293425940384623e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006459978758357465, "sensitivity": 0.5589603451073145 }, { "name": "model.layers.29.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.876378756714985e-05, "sensitivity": 0.8206796680977609 }, { "name": "model.layers.29.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.695794460640172e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007909519481472671, "sensitivity": 0.5592413850257201 }, { "name": "model.layers.29.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.260158988879994e-05, "sensitivity": 0.8584946706150576 }, { "name": "model.layers.29.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.556765808658383e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007190449978224933, "sensitivity": 0.5270427544447248 }, { "name": "model.layers.29.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.188862607814372e-05, "sensitivity": 0.8598400868669094 }, { "name": "model.layers.29.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.433704922732431e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007041522767394781, "sensitivity": 0.5939115945707742 }, { "name": "model.layers.29.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1699459719238803e-05, "sensitivity": 1.351683140597715 }, { "name": "model.layers.29.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0357935025240295e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.420719728339463e-05, "sensitivity": 0.6220629446744618 }, { "name": "model.layers.29.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0798736184369773e-05, "sensitivity": 1.2822720815714983 }, { "name": "model.layers.29.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.989412438291765e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.880851676920429e-05, "sensitivity": 0.6410048427064311 }, { "name": "model.layers.29.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.028365169186145e-05, "sensitivity": 1.1083570109043792 }, { "name": "model.layers.29.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.531968660463463e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006908149225637317, "sensitivity": 0.5345563651933907 }, { "name": "model.layers.29.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.265808431431651e-05, "sensitivity": 1.0788281190084836 }, { "name": "model.layers.29.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0629898952174699e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.459458043333143e-05, "sensitivity": 0.7556311788148847 }, { "name": "model.layers.29.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.83390865358524e-05, "sensitivity": 1.0535404893695808 }, { "name": "model.layers.29.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0908049716817914e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.879052332602441e-05, "sensitivity": 0.7183428750320041 }, { "name": "model.layers.29.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0993431715178303e-05, "sensitivity": 1.2326023219237154 }, { "name": "model.layers.29.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.711209258966846e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000676387338899076, "sensitivity": 0.5116077436750265 }, { "name": "model.layers.29.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.432647205656394e-05, "sensitivity": 1.0017480219088917 }, { "name": "model.layers.29.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.376708595074888e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007347021019086242, "sensitivity": 0.5224913083325531 }, { "name": "model.layers.29.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1400333278288599e-05, "sensitivity": 1.5576240295820754 }, { "name": "model.layers.29.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.995477406235295e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006943045882508159, "sensitivity": 0.5048246666250034 }, { "name": "model.layers.29.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.011391476728022e-05, "sensitivity": 1.183016337614897 }, { "name": "model.layers.29.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.692517106581363e-07, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006028522620908916, "sensitivity": 0.5095738504080318 }, { "name": "model.layers.29.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8794597862288356e-05, "sensitivity": 0.9245617575536266 }, { "name": "model.layers.29.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1629790606093593e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006719491793774068, "sensitivity": 0.5295724505497401 }, { "name": "model.layers.29.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 3.8845482777105644e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.589534688013373e-06, "sensitivity": 2.102444515648742 }, { "name": "model.layers.29.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0225389814877417e-06, "sensitivity": 10.0 }, { "name": "model.layers.29.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 8.044953574426472e-06, "sensitivity": 1.9103508405580032 }, { "name": "model.layers.29.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 9.417742148798425e-06, "sensitivity": 2.055706685766689 }, { "name": "model.layers.29.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.000219018169445917, "sensitivity": 0.8624596053524523 }, { "name": "model.layers.29.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.5322419130825438e-05, "sensitivity": 1.052707068247565 }, { "name": "model.layers.29.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.8257497585145757e-05, "sensitivity": 0.6497595872171725 }, { "name": "model.layers.29.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003324975841678679, "sensitivity": 0.7475651932465758 }, { "name": "model.layers.30.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.015154576743953e-05, "sensitivity": 0.7426248567302006 }, { "name": "model.layers.30.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.708102197691915e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006990457768552005, "sensitivity": 0.570338974266182 }, { "name": "model.layers.30.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0257415851810947e-05, "sensitivity": 1.341510098576097 }, { "name": "model.layers.30.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4229308362700976e-06, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006257821805775166, "sensitivity": 0.557440358996066 }, { "name": "model.layers.30.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.416493316559354e-06, "sensitivity": 2.068032270043641 }, { "name": "model.layers.30.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.421631380566396e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006835166714154184, "sensitivity": 0.5369512121082289 }, { "name": "model.layers.30.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.968460027361289e-05, "sensitivity": 0.6299516066963418 }, { "name": "model.layers.30.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.458995128217794e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006997189484536648, "sensitivity": 0.5421818028623373 }, { "name": "model.layers.30.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006527408841066062, "sensitivity": 0.5457427932893928 }, { "name": "model.layers.30.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.343693712551612e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000652086571790278, "sensitivity": 0.5183539764359181 }, { "name": "model.layers.30.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006958710728213191, "sensitivity": 0.5268857457250861 }, { "name": "model.layers.30.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.23251218914811e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007068949053063989, "sensitivity": 0.5297693285126956 }, { "name": "model.layers.30.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.775525642093271e-05, "sensitivity": 0.6459913728286961 }, { "name": "model.layers.30.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.636366490260116e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006463612662628293, "sensitivity": 0.5280918235111568 }, { "name": "model.layers.30.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.2382281864993274e-05, "sensitivity": 0.730148379891373 }, { "name": "model.layers.30.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.969402536720736e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006135470466688275, "sensitivity": 0.5375751724808642 }, { "name": "model.layers.30.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.635462341364473e-05, "sensitivity": 0.6607404951264891 }, { "name": "model.layers.30.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.353126984024129e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007420014590024948, "sensitivity": 0.5805494042852634 }, { "name": "model.layers.30.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.411562945781043e-06, "sensitivity": 2.097195952399568 }, { "name": "model.layers.30.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1588028883124935e-06, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.18297272012569e-05, "sensitivity": 0.7682464693916097 }, { "name": "model.layers.30.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0808637499576434e-05, "sensitivity": 0.7145488850709897 }, { "name": "model.layers.30.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.111655122571392e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006838343106210232, "sensitivity": 0.5822331405121125 }, { "name": "model.layers.30.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006563186179846525, "sensitivity": 0.5312036906048698 }, { "name": "model.layers.30.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.58748569751333e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006964618805795908, "sensitivity": 0.5298753878260306 }, { "name": "model.layers.30.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006754223140887916, "sensitivity": 0.5156401130429054 }, { "name": "model.layers.30.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.447945336025441e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006823883741162717, "sensitivity": 0.5107908400844566 }, { "name": "model.layers.30.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006073982222005725, "sensitivity": 0.5254207564720779 }, { "name": "model.layers.30.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.274547104112571e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006089885719120502, "sensitivity": 0.5631131213536003 }, { "name": "model.layers.30.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006655773613601923, "sensitivity": 0.555978133400762 }, { "name": "model.layers.30.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.66364451010304e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006464900798164308, "sensitivity": 0.5394717314773105 }, { "name": "model.layers.30.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.25215470790863e-05, "sensitivity": 0.8981661383305738 }, { "name": "model.layers.30.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.160312401945703e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007082045776769519, "sensitivity": 0.5297602055596318 }, { "name": "model.layers.30.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.308461161097512e-05, "sensitivity": 0.8069084378586999 }, { "name": "model.layers.30.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.778459464840125e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007002949714660645, "sensitivity": 0.5352083518415255 }, { "name": "model.layers.30.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.609127038042061e-05, "sensitivity": 0.986270045721959 }, { "name": "model.layers.30.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2706118468486238e-06, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006351824849843979, "sensitivity": 0.5286329893672858 }, { "name": "model.layers.30.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.066116475267336e-05, "sensitivity": 0.6218357283518234 }, { "name": "model.layers.30.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.527363325403712e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006956635043025017, "sensitivity": 0.5063376454329676 }, { "name": "model.layers.30.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006834025261923671, "sensitivity": 0.532428491987421 }, { "name": "model.layers.30.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.93891479386366e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006704911356791854, "sensitivity": 0.5246352978118395 }, { "name": "model.layers.30.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.699572259094566e-05, "sensitivity": 0.7592780785958149 }, { "name": "model.layers.30.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.041525004249706e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008001071400940418, "sensitivity": 0.5201011674764794 }, { "name": "model.layers.30.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.042468885425478e-05, "sensitivity": 0.6490340403344277 }, { "name": "model.layers.30.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1952124623348936e-06, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006754541536793113, "sensitivity": 0.5893423985990394 }, { "name": "model.layers.30.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007010068511590362, "sensitivity": 0.5273114252977092 }, { "name": "model.layers.30.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.999040351729491e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007172173354774714, "sensitivity": 0.5270306134711955 }, { "name": "model.layers.30.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.67907006572932e-05, "sensitivity": 0.6118122355639802 }, { "name": "model.layers.30.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.126656894091866e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007512892480008304, "sensitivity": 0.5399264717840342 }, { "name": "model.layers.30.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.008451964589767e-05, "sensitivity": 0.8854572099077197 }, { "name": "model.layers.30.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.219863272846851e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000699728901963681, "sensitivity": 0.5180591156333413 }, { "name": "model.layers.30.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006918796570971608, "sensitivity": 0.5580297169804179 }, { "name": "model.layers.30.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.048790505199577e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006738638039678335, "sensitivity": 0.5185833491562031 }, { "name": "model.layers.30.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.27662957413122e-05, "sensitivity": 1.0814659311030466 }, { "name": "model.layers.30.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.413457746632048e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007094471948221326, "sensitivity": 0.5640582882641668 }, { "name": "model.layers.30.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0162171747651882e-05, "sensitivity": 1.218976329322489 }, { "name": "model.layers.30.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.677605822209443e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.799374412163161e-05, "sensitivity": 0.619416337755879 }, { "name": "model.layers.30.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8360510593047366e-05, "sensitivity": 1.1677657418330314 }, { "name": "model.layers.30.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.812866786276572e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006855240790173411, "sensitivity": 0.5160652001522761 }, { "name": "model.layers.30.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.099830352468416e-05, "sensitivity": 0.9548676359623324 }, { "name": "model.layers.30.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.200710696342867e-06, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.188444967847317e-05, "sensitivity": 0.6023869635624379 }, { "name": "model.layers.30.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.634227636619471e-05, "sensitivity": 0.733555979292331 }, { "name": "model.layers.30.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.315488801395986e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6012584536802024e-05, "sensitivity": 0.6359785545623443 }, { "name": "model.layers.30.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.044408418238163e-05, "sensitivity": 1.2033294355967934 }, { "name": "model.layers.30.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.308987963166146e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006480125593952835, "sensitivity": 0.5548057581737598 }, { "name": "model.layers.30.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.284918345045298e-05, "sensitivity": 0.6717903528204221 }, { "name": "model.layers.30.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.661486390337814e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000710463966242969, "sensitivity": 0.5555197050832431 }, { "name": "model.layers.30.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.311116077180486e-06, "sensitivity": 2.0969564656731934 }, { "name": "model.layers.30.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0233148941551917e-06, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.632851389236748e-05, "sensitivity": 0.630907247094808 }, { "name": "model.layers.30.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.033224053680897e-05, "sensitivity": 0.6442301639298704 }, { "name": "model.layers.30.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.342804337895359e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006754806963726878, "sensitivity": 0.5561440616800098 }, { "name": "model.layers.30.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007118529174476862, "sensitivity": 0.5422963772813969 }, { "name": "model.layers.30.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.256641876869253e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007107066339813173, "sensitivity": 0.5588908812659912 }, { "name": "model.layers.30.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.225402466952801e-05, "sensitivity": 0.7906861539903387 }, { "name": "model.layers.30.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.479971711494727e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.446888437494636e-05, "sensitivity": 0.6032756506953696 }, { "name": "model.layers.30.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0619626310653985e-05, "sensitivity": 0.6361755813530433 }, { "name": "model.layers.30.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.904165724743507e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000665870844386518, "sensitivity": 0.553426458133951 }, { "name": "model.layers.30.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0791539352794643e-05, "sensitivity": 1.6829568291601338 }, { "name": "model.layers.30.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.070061312537291e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006561347981914878, "sensitivity": 0.5469639422869249 }, { "name": "model.layers.30.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1938354873564094e-05, "sensitivity": 1.3713120082585726 }, { "name": "model.layers.30.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.141029752550821e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007126179407350719, "sensitivity": 0.541734676034441 }, { "name": "model.layers.30.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006823695148341358, "sensitivity": 0.5242518275347718 }, { "name": "model.layers.30.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.346495405930909e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006622931687161326, "sensitivity": 0.5347347814650977 }, { "name": "model.layers.30.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0005722594214603305, "sensitivity": 0.5160303290752728 }, { "name": "model.layers.30.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.777962428510364e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006014804821461439, "sensitivity": 0.5754627319974269 }, { "name": "model.layers.30.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.832753231516108e-05, "sensitivity": 0.6650601408621338 }, { "name": "model.layers.30.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.423597819273709e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006914226105436683, "sensitivity": 0.5302615652543387 }, { "name": "model.layers.30.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006521005998365581, "sensitivity": 0.5416308612017834 }, { "name": "model.layers.30.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.785887194382667e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006727149593643844, "sensitivity": 0.5354997677898555 }, { "name": "model.layers.30.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.51544944755733e-05, "sensitivity": 0.636079790850619 }, { "name": "model.layers.30.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.472079689956445e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006613274454139173, "sensitivity": 0.507410377369462 }, { "name": "model.layers.30.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006492552347481251, "sensitivity": 0.5308803764242738 }, { "name": "model.layers.30.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.755552703907597e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006690435111522675, "sensitivity": 0.5411096740341178 }, { "name": "model.layers.30.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.460402356518898e-06, "sensitivity": 2.0200801708431744 }, { "name": "model.layers.30.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.79949959400983e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000674651877488941, "sensitivity": 0.5680931246618184 }, { "name": "model.layers.30.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.299297092482448e-05, "sensitivity": 0.8867253477220367 }, { "name": "model.layers.30.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.157261734391795e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007330344524234533, "sensitivity": 0.560721048773979 }, { "name": "model.layers.30.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.222270894795656e-05, "sensitivity": 0.7954661401723553 }, { "name": "model.layers.30.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.009703265088319e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006806800956837833, "sensitivity": 0.5455696565941418 }, { "name": "model.layers.30.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.974786472506821e-05, "sensitivity": 0.6723743552272199 }, { "name": "model.layers.30.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.445172514053411e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007063198718242347, "sensitivity": 0.5576978653888438 }, { "name": "model.layers.30.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5851429351605475e-05, "sensitivity": 0.7364756085932235 }, { "name": "model.layers.30.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.620248538842134e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.893485649721697e-05, "sensitivity": 0.8522049513356869 }, { "name": "model.layers.30.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.370234041241929e-05, "sensitivity": 0.6197783540478244 }, { "name": "model.layers.30.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.212435662040662e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007217250531539321, "sensitivity": 0.5321019213411731 }, { "name": "model.layers.30.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000654602306894958, "sensitivity": 0.530465275731082 }, { "name": "model.layers.30.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.233106427724124e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006613265722990036, "sensitivity": 0.5222997290923046 }, { "name": "model.layers.30.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0877035139128566e-05, "sensitivity": 0.7457574150362853 }, { "name": "model.layers.30.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.526483270543395e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006738962838426232, "sensitivity": 0.534732496544086 }, { "name": "model.layers.30.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006636708858422935, "sensitivity": 0.5195797426537276 }, { "name": "model.layers.30.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.641471029273816e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006632024305872619, "sensitivity": 0.5196129123776887 }, { "name": "model.layers.30.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9599551605060697e-05, "sensitivity": 1.0057646697736238 }, { "name": "model.layers.30.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.830584986048052e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006895669503137469, "sensitivity": 0.5602400107011698 }, { "name": "model.layers.30.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.854888488305733e-05, "sensitivity": 0.8415411470399301 }, { "name": "model.layers.30.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.822599622566486e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008085812442004681, "sensitivity": 0.5280799334258095 }, { "name": "model.layers.30.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006746994331479073, "sensitivity": 0.5898004915216961 }, { "name": "model.layers.30.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.446526524290675e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006855802494101226, "sensitivity": 0.5336895431191634 }, { "name": "model.layers.30.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2129424248996656e-05, "sensitivity": 1.6884000705170799 }, { "name": "model.layers.30.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0735639079939574e-06, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007837393786758184, "sensitivity": 0.5348358995309848 }, { "name": "model.layers.30.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006310338503681123, "sensitivity": 0.5762165648324461 }, { "name": "model.layers.30.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.931494110380299e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006336253136396408, "sensitivity": 0.5339243528805794 }, { "name": "model.layers.30.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.347291491692886e-05, "sensitivity": 0.7781287257797715 }, { "name": "model.layers.30.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0433032002765685e-06, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000784137926530093, "sensitivity": 0.562086903939062 }, { "name": "model.layers.30.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006617470644414425, "sensitivity": 0.575948489812812 }, { "name": "model.layers.30.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.942205115796241e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006689120782539248, "sensitivity": 0.5317671789060421 }, { "name": "model.layers.30.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.072557152947411e-05, "sensitivity": 0.7557548082297848 }, { "name": "model.layers.30.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.698338665955816e-07, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007093813037499785, "sensitivity": 0.5447646745469671 }, { "name": "model.layers.30.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1320262274239212e-05, "sensitivity": 1.4163730000425874 }, { "name": "model.layers.30.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0273743100697175e-06, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0776026657549664e-05, "sensitivity": 0.8746320371225154 }, { "name": "model.layers.30.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 3.4489867175580002e-06, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.299735342603526e-06, "sensitivity": 2.1024977629783432 }, { "name": "model.layers.30.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2669231637119083e-06, "sensitivity": 10.0 }, { "name": "model.layers.30.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.929786321852589e-06, "sensitivity": 2.106870270311985 }, { "name": "model.layers.30.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 3.6172932595945895e-05, "sensitivity": 1.9474194293608793 }, { "name": "model.layers.30.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00020695090643130243, "sensitivity": 0.9157667066935129 }, { "name": "model.layers.30.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.4540173651766963e-05, "sensitivity": 1.0612963919674225 }, { "name": "model.layers.30.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.5201999202836305e-05, "sensitivity": 0.6605952275194953 }, { "name": "model.layers.30.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003148860123474151, "sensitivity": 0.7093501681741063 }, { "name": "model.layers.31.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8468263887334615e-05, "sensitivity": 0.7704368753166795 }, { "name": "model.layers.31.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.081580856218352e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006674011237919331, "sensitivity": 0.5529444141700486 }, { "name": "model.layers.31.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.511792889796197e-05, "sensitivity": 0.6415341005553679 }, { "name": "model.layers.31.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.7204504123074e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007301999139599502, "sensitivity": 0.5286666147702828 }, { "name": "model.layers.31.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.619533476419747e-05, "sensitivity": 0.8940571967045164 }, { "name": "model.layers.31.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.339020496350713e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006201354553923011, "sensitivity": 0.5290649406384328 }, { "name": "model.layers.31.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.349934119498357e-05, "sensitivity": 0.6277061001064559 }, { "name": "model.layers.31.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.017706593615003e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007138755172491074, "sensitivity": 0.5469204769421583 }, { "name": "model.layers.31.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.684990173904225e-05, "sensitivity": 1.1979168465733443 }, { "name": "model.layers.31.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1360696134943282e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.610445441561751e-05, "sensitivity": 1.0133012421606187 }, { "name": "model.layers.31.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.827905599493533e-05, "sensitivity": 0.6365132678327916 }, { "name": "model.layers.31.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.839330914473976e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007780664600431919, "sensitivity": 0.5254554889456059 }, { "name": "model.layers.31.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.177544128149748e-05, "sensitivity": 0.652042736836698 }, { "name": "model.layers.31.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.562518587496015e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006849101046100259, "sensitivity": 0.5229993940747226 }, { "name": "model.layers.31.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8996094594476745e-05, "sensitivity": 0.9001274458719446 }, { "name": "model.layers.31.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.080515729285253e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006580407498404384, "sensitivity": 0.5584736089117935 }, { "name": "model.layers.31.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.3075146853225306e-05, "sensitivity": 1.3283786793144876 }, { "name": "model.layers.31.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.401481313223485e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.425007061101496e-05, "sensitivity": 0.8093269055792073 }, { "name": "model.layers.31.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1304039617243689e-05, "sensitivity": 1.6346502932725566 }, { "name": "model.layers.31.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8674481907510199e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006828908808529377, "sensitivity": 0.5795146250480949 }, { "name": "model.layers.31.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.022580782882869e-05, "sensitivity": 0.7738845698542013 }, { "name": "model.layers.31.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.406168040484772e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006686788401566446, "sensitivity": 0.5631080963940606 }, { "name": "model.layers.31.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.375870725605637e-05, "sensitivity": 0.9030434653779285 }, { "name": "model.layers.31.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.460939741577022e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.35336764389649e-05, "sensitivity": 0.6671240378049691 }, { "name": "model.layers.31.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8716843341244385e-05, "sensitivity": 0.8648350763376629 }, { "name": "model.layers.31.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.855777314740408e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006524638156406581, "sensitivity": 0.5290384567532244 }, { "name": "model.layers.31.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.607050843536854e-05, "sensitivity": 0.894590257243086 }, { "name": "model.layers.31.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.24347694106109e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006378382677212358, "sensitivity": 0.5207844009303269 }, { "name": "model.layers.31.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7830642617773265e-05, "sensitivity": 0.6231027577611008 }, { "name": "model.layers.31.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.521796305809403e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006521535106003284, "sensitivity": 0.539107912431757 }, { "name": "model.layers.31.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.558683526236564e-05, "sensitivity": 0.6299234225508884 }, { "name": "model.layers.31.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0819728686328745e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007361457101069391, "sensitivity": 0.5116815001425605 }, { "name": "model.layers.31.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.356211088132113e-05, "sensitivity": 0.7695195594767232 }, { "name": "model.layers.31.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.574600431325962e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007274709641933441, "sensitivity": 0.5268401927394826 }, { "name": "model.layers.31.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.971819336991757e-05, "sensitivity": 0.6334547217803769 }, { "name": "model.layers.31.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.814804578425537e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006592515856027603, "sensitivity": 0.5430403162978247 }, { "name": "model.layers.31.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.718471948057413e-05, "sensitivity": 0.8860518885336821 }, { "name": "model.layers.31.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.698481567786075e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006593194557353854, "sensitivity": 0.5629133412569021 }, { "name": "model.layers.31.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.433457019738853e-05, "sensitivity": 1.1254282613929973 }, { "name": "model.layers.31.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1986179515588447e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007379350136034191, "sensitivity": 0.5787052113683426 }, { "name": "model.layers.31.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.243315147003159e-05, "sensitivity": 1.1387711831125709 }, { "name": "model.layers.31.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.299813091776741e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007094683824107051, "sensitivity": 0.5533504954977201 }, { "name": "model.layers.31.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.487010978162289e-05, "sensitivity": 0.8870397562972074 }, { "name": "model.layers.31.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.845452950685285e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007366963545791805, "sensitivity": 0.5820904974332545 }, { "name": "model.layers.31.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7183449825970456e-05, "sensitivity": 0.656502066192816 }, { "name": "model.layers.31.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.973290164249192e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006509209633804858, "sensitivity": 0.5411742853127636 }, { "name": "model.layers.31.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1323614671709947e-05, "sensitivity": 1.3312245108474534 }, { "name": "model.layers.31.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.52450057209353e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.21297222096473e-05, "sensitivity": 0.709557071624678 }, { "name": "model.layers.31.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1298370736767538e-05, "sensitivity": 1.4353513722909486 }, { "name": "model.layers.31.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.637795758659195e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.1371079381206073e-05, "sensitivity": 1.2417765141231936 }, { "name": "model.layers.31.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0344551457092166e-05, "sensitivity": 0.651280011400859 }, { "name": "model.layers.31.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.368881031448836e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006832012441009283, "sensitivity": 0.5449003469395284 }, { "name": "model.layers.31.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.100889731897041e-05, "sensitivity": 0.6805697676640046 }, { "name": "model.layers.31.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.011695851768309e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006746221333742142, "sensitivity": 0.5539541937754147 }, { "name": "model.layers.31.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.130707333795726e-05, "sensitivity": 0.898342347826991 }, { "name": "model.layers.31.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.560184028283402e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.240061338758096e-05, "sensitivity": 0.699196286363331 }, { "name": "model.layers.31.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.455281254602596e-05, "sensitivity": 0.6060145630080613 }, { "name": "model.layers.31.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.114626328075246e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007253969088196754, "sensitivity": 0.5264872277296274 }, { "name": "model.layers.31.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.352518539642915e-05, "sensitivity": 0.9021443910946008 }, { "name": "model.layers.31.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.693615202697401e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007116659544408321, "sensitivity": 0.5444819090803857 }, { "name": "model.layers.31.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.693281855201349e-05, "sensitivity": 0.8406657801146122 }, { "name": "model.layers.31.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.154355800281337e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000648379442282021, "sensitivity": 0.5485529437568162 }, { "name": "model.layers.31.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.49531721137464e-05, "sensitivity": 0.8533022512698942 }, { "name": "model.layers.31.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0707019555411534e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007387680816464126, "sensitivity": 0.5947496587679157 }, { "name": "model.layers.31.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0446146916365251e-05, "sensitivity": 1.8687426565065384 }, { "name": "model.layers.31.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.578119263802364e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.948282341705635e-05, "sensitivity": 0.8644843626500631 }, { "name": "model.layers.31.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006728979060426354, "sensitivity": 0.5286270315974673 }, { "name": "model.layers.31.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.810951163060963e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006890149670653045, "sensitivity": 0.5334115081374763 }, { "name": "model.layers.31.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0842823940038215e-05, "sensitivity": 1.2807508756914276 }, { "name": "model.layers.31.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6346336906281067e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006495722918771207, "sensitivity": 0.5898554595158239 }, { "name": "model.layers.31.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.640401261392981e-05, "sensitivity": 0.9279391272750697 }, { "name": "model.layers.31.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.424829047726234e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.593161378987134e-05, "sensitivity": 0.781532215612114 }, { "name": "model.layers.31.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4921521344367648e-06, "sensitivity": 2.0377173950635514 }, { "name": "model.layers.31.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.517529413940792e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007034411537460983, "sensitivity": 0.5831895966959659 }, { "name": "model.layers.31.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007116184569895267, "sensitivity": 0.5167591744493841 }, { "name": "model.layers.31.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.56876908983395e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007220436818897724, "sensitivity": 0.538829350031002 }, { "name": "model.layers.31.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.998825508868322e-05, "sensitivity": 1.0081319464927576 }, { "name": "model.layers.31.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0649193882272812e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.948321631876752e-05, "sensitivity": 0.7711673381502773 }, { "name": "model.layers.31.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.886694270884618e-05, "sensitivity": 0.8075581139603659 }, { "name": "model.layers.31.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.013052155940386e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.973217048449442e-05, "sensitivity": 0.673664175340692 }, { "name": "model.layers.31.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.21599901933223e-05, "sensitivity": 0.6508413306085191 }, { "name": "model.layers.31.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.250984819824225e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.1500642914325e-05, "sensitivity": 0.6049076723641859 }, { "name": "model.layers.31.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006808378966525197, "sensitivity": 0.5208643844970862 }, { "name": "model.layers.31.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.783395747333998e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006754760397598147, "sensitivity": 0.538272997584305 }, { "name": "model.layers.31.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007046404061838984, "sensitivity": 0.568389341079643 }, { "name": "model.layers.31.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.029593120932986e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007014821167103946, "sensitivity": 0.5339323282858275 }, { "name": "model.layers.31.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006812801002524793, "sensitivity": 0.5453009281263134 }, { "name": "model.layers.31.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.037923523967038e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007010138942860067, "sensitivity": 0.5404320787283657 }, { "name": "model.layers.31.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.81870078551583e-05, "sensitivity": 0.7702119661717827 }, { "name": "model.layers.31.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.47266846903949e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008017338695935905, "sensitivity": 0.5350504548180041 }, { "name": "model.layers.31.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.913656059419736e-05, "sensitivity": 0.7901492028913242 }, { "name": "model.layers.31.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.042073543241713e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006699702935293317, "sensitivity": 0.5503786042450737 }, { "name": "model.layers.31.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.406678585335612e-05, "sensitivity": 0.7009094963382627 }, { "name": "model.layers.31.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.659405577622238e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007090986473485827, "sensitivity": 0.5265877850917609 }, { "name": "model.layers.31.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.886701910640113e-05, "sensitivity": 0.7843673569548426 }, { "name": "model.layers.31.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.284968776526512e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000662897014990449, "sensitivity": 0.526075505707002 }, { "name": "model.layers.31.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006759184179827571, "sensitivity": 0.5187657813125973 }, { "name": "model.layers.31.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.443279971790616e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006654299795627594, "sensitivity": 0.5557285372885824 }, { "name": "model.layers.31.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007128709694370627, "sensitivity": 0.5862122609632472 }, { "name": "model.layers.31.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.851219265830878e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007100088405422866, "sensitivity": 0.5321009028753962 }, { "name": "model.layers.31.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.917869202676229e-05, "sensitivity": 0.7439762383398979 }, { "name": "model.layers.31.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0575116675681784e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8772682677954435e-05, "sensitivity": 0.6697990741169153 }, { "name": "model.layers.31.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.267271237447858e-05, "sensitivity": 0.6693018300641805 }, { "name": "model.layers.31.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0351918717788067e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007131524616852403, "sensitivity": 0.5553862804516791 }, { "name": "model.layers.31.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.571525980485603e-05, "sensitivity": 0.7593574912346379 }, { "name": "model.layers.31.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.50231811505364e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006214475142769516, "sensitivity": 0.5186585832806565 }, { "name": "model.layers.31.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007052220171317458, "sensitivity": 0.5543268492316018 }, { "name": "model.layers.31.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.105981580934895e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007125932606868446, "sensitivity": 0.5515786949927082 }, { "name": "model.layers.31.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006962413317523897, "sensitivity": 0.5385200483808844 }, { "name": "model.layers.31.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.852926273699268e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006926399655640125, "sensitivity": 0.5405527167675919 }, { "name": "model.layers.31.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.170654523884878e-05, "sensitivity": 1.1100872987952222 }, { "name": "model.layers.31.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.091602469699865e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006956871366128325, "sensitivity": 0.5360212011740967 }, { "name": "model.layers.31.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.15095705143176e-05, "sensitivity": 0.6811563517245001 }, { "name": "model.layers.31.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.374716801678005e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007062244112603366, "sensitivity": 0.5287654391470051 }, { "name": "model.layers.31.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3609932213730644e-06, "sensitivity": 2.023153175088108 }, { "name": "model.layers.31.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.27149473883037e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006437036208808422, "sensitivity": 0.5416564376507254 }, { "name": "model.layers.31.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.237586785573512e-05, "sensitivity": 0.7100317415014715 }, { "name": "model.layers.31.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2045081803080393e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007157950894907117, "sensitivity": 0.5899702485633888 }, { "name": "model.layers.31.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006820306880399585, "sensitivity": 0.5833699612789833 }, { "name": "model.layers.31.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.224387784139253e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006842842558398843, "sensitivity": 0.5018189453865229 }, { "name": "model.layers.31.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007270959904417396, "sensitivity": 0.5259081677053208 }, { "name": "model.layers.31.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.301316031771421e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007231729105114937, "sensitivity": 0.5514941835225439 }, { "name": "model.layers.31.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1107618774985895e-05, "sensitivity": 1.4002047695620259 }, { "name": "model.layers.31.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.255491497431649e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006731553003191948, "sensitivity": 0.5585212465689661 }, { "name": "model.layers.31.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1154217645525932e-05, "sensitivity": 1.4385724265204927 }, { "name": "model.layers.31.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.069547223181871e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006714066839776933, "sensitivity": 0.5192027185299167 }, { "name": "model.layers.31.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007347787613980472, "sensitivity": 0.5125204700049452 }, { "name": "model.layers.31.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.318411346408539e-07, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007288306951522827, "sensitivity": 0.587615550700303 }, { "name": "model.layers.31.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 3.210554496035911e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.2065328266762663e-06, "sensitivity": 2.1003828096964607 }, { "name": "model.layers.31.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0882532706091297e-06, "sensitivity": 10.0 }, { "name": "model.layers.31.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.7383321164743393e-06, "sensitivity": 2.1022655755006223 }, { "name": "model.layers.31.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 3.1080002372618765e-05, "sensitivity": 1.843732268177789 }, { "name": "model.layers.31.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00022236672521103173, "sensitivity": 1.0170271287880843 }, { "name": "model.layers.31.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.5215414350677747e-05, "sensitivity": 1.6214888361845718 }, { "name": "model.layers.31.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 4.782108590006828e-05, "sensitivity": 0.7004973790226638 }, { "name": "model.layers.31.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00032895314507186413, "sensitivity": 0.9240737662961647 }, { "name": "model.layers.32.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.606420381809585e-05, "sensitivity": 0.9649362148635467 }, { "name": "model.layers.32.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.942946578827105e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006692299502901733, "sensitivity": 0.5460937836512545 }, { "name": "model.layers.32.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.264478724915534e-05, "sensitivity": 0.6099876155725494 }, { "name": "model.layers.32.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.525389603164513e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007197638042271137, "sensitivity": 0.5200105510464363 }, { "name": "model.layers.32.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.177735485835001e-05, "sensitivity": 0.6629840281453379 }, { "name": "model.layers.32.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.793670420142007e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006975379656068981, "sensitivity": 0.5561546745096749 }, { "name": "model.layers.32.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0763587852125056e-05, "sensitivity": 1.2589342310986502 }, { "name": "model.layers.32.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0428508403492742e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006716895732097328, "sensitivity": 0.5662512122030134 }, { "name": "model.layers.32.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7890323660103604e-05, "sensitivity": 0.6347098733428269 }, { "name": "model.layers.32.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.321653245322523e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006427511107176542, "sensitivity": 0.5346122988248505 }, { "name": "model.layers.32.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0927504263236187e-05, "sensitivity": 1.501595800691353 }, { "name": "model.layers.32.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.199421810990316e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006697450298815966, "sensitivity": 0.5411569095923207 }, { "name": "model.layers.32.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8642639487516135e-05, "sensitivity": 1.1739049069702896 }, { "name": "model.layers.32.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0378830666013528e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.792958472738974e-05, "sensitivity": 0.6776969188811238 }, { "name": "model.layers.32.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.162956560729071e-05, "sensitivity": 0.6174896995213673 }, { "name": "model.layers.32.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.686778644711012e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000701658776961267, "sensitivity": 0.5410541531080846 }, { "name": "model.layers.32.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0450092860264704e-05, "sensitivity": 1.1273146457985566 }, { "name": "model.layers.32.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.025373290365678e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006752379122190177, "sensitivity": 0.5294148411093001 }, { "name": "model.layers.32.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0923674381047022e-05, "sensitivity": 1.2377859391467771 }, { "name": "model.layers.32.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1817268159575178e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.853161565028131e-05, "sensitivity": 0.6383737555960157 }, { "name": "model.layers.32.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.48640125291422e-05, "sensitivity": 0.8251090696989805 }, { "name": "model.layers.32.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.488242085353704e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007383585325442255, "sensitivity": 0.5300407158467315 }, { "name": "model.layers.32.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.207423575688154e-05, "sensitivity": 0.7946880630124619 }, { "name": "model.layers.32.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.779234240639198e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.178009061841294e-05, "sensitivity": 0.607340278864307 }, { "name": "model.layers.32.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.113674317020923e-05, "sensitivity": 0.6132008277580436 }, { "name": "model.layers.32.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.503631872576079e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006904994370415807, "sensitivity": 0.4919487280778674 }, { "name": "model.layers.32.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.943081825738773e-05, "sensitivity": 0.7095702993013553 }, { "name": "model.layers.32.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.344419388260576e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007908889092504978, "sensitivity": 0.528887365592974 }, { "name": "model.layers.32.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.227463018149137e-05, "sensitivity": 0.633281353503186 }, { "name": "model.layers.32.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4148527043289505e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.405655585695058e-05, "sensitivity": 0.7681167398438503 }, { "name": "model.layers.32.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1613003152888268e-05, "sensitivity": 1.4652860008941089 }, { "name": "model.layers.32.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5658297343179584e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.480098818428814e-05, "sensitivity": 0.6678229223136656 }, { "name": "model.layers.32.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.223351682710927e-05, "sensitivity": 1.2602449860418625 }, { "name": "model.layers.32.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2119387520215241e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.807866884628311e-05, "sensitivity": 0.9876875747720937 }, { "name": "model.layers.32.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.837734690634534e-05, "sensitivity": 0.7889816088325164 }, { "name": "model.layers.32.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.310826953878859e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007940231589600444, "sensitivity": 0.5613844542270392 }, { "name": "model.layers.32.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.75334343011491e-05, "sensitivity": 0.8937335580408019 }, { "name": "model.layers.32.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.304001883312594e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006605214439332485, "sensitivity": 0.5664894246302907 }, { "name": "model.layers.32.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.292965215630829e-05, "sensitivity": 0.6327678393903684 }, { "name": "model.layers.32.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.056773938529659e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005934405489824712, "sensitivity": 0.5736928104195572 }, { "name": "model.layers.32.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.077988235920202e-05, "sensitivity": 1.607922855116103 }, { "name": "model.layers.32.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.693185691299732e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006635033059865236, "sensitivity": 0.5264583360594192 }, { "name": "model.layers.32.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.262138776946813e-05, "sensitivity": 1.0255864866149005 }, { "name": "model.layers.32.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1951515261898749e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007082329830154777, "sensitivity": 0.5386833049611613 }, { "name": "model.layers.32.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.717349631595425e-05, "sensitivity": 1.1645337476644635 }, { "name": "model.layers.32.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.063376203092048e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6595290516270325e-05, "sensitivity": 0.6741938063173372 }, { "name": "model.layers.32.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006903344765305519, "sensitivity": 0.5904269513248983 }, { "name": "model.layers.32.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.936674132404733e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006825685268267989, "sensitivity": 0.575232272570484 }, { "name": "model.layers.32.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4613337852060795e-05, "sensitivity": 0.8231950585458379 }, { "name": "model.layers.32.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.90253125160234e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.697091546608135e-05, "sensitivity": 0.9315570205131368 }, { "name": "model.layers.32.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.956495806458406e-05, "sensitivity": 0.9557852232681884 }, { "name": "model.layers.32.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0277642559231026e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.93583972658962e-05, "sensitivity": 0.6632908220734861 }, { "name": "model.layers.32.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.818991849082522e-05, "sensitivity": 0.788923386559863 }, { "name": "model.layers.32.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.086329899015254e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006477299029938877, "sensitivity": 0.5401601777353245 }, { "name": "model.layers.32.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.930311090196483e-05, "sensitivity": 0.976002747168798 }, { "name": "model.layers.32.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0261964007440838e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006750712636858225, "sensitivity": 0.5635334888929803 }, { "name": "model.layers.32.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.726619201595895e-05, "sensitivity": 0.641452012568015 }, { "name": "model.layers.32.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.734861012271722e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006624259403906763, "sensitivity": 0.544644950746431 }, { "name": "model.layers.32.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.987042823107913e-05, "sensitivity": 0.8828869072055597 }, { "name": "model.layers.32.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1114946119050728e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006926789646968246, "sensitivity": 0.5418076702668061 }, { "name": "model.layers.32.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.834604235133156e-05, "sensitivity": 0.7405520023711487 }, { "name": "model.layers.32.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.418398351750511e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006570319528691471, "sensitivity": 0.5141282953767896 }, { "name": "model.layers.32.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.156949191587046e-05, "sensitivity": 0.6975456027996739 }, { "name": "model.layers.32.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.852090675442014e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005866794381290674, "sensitivity": 0.5355309593464829 }, { "name": "model.layers.32.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1322632417432033e-05, "sensitivity": 1.6692574026486922 }, { "name": "model.layers.32.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.513217284809798e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.322185072349384e-05, "sensitivity": 1.009470402418739 }, { "name": "model.layers.32.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.60502776352223e-05, "sensitivity": 0.9767531550004218 }, { "name": "model.layers.32.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.238066809302836e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006358891259878874, "sensitivity": 0.5474379857543366 }, { "name": "model.layers.32.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.143245263956487e-05, "sensitivity": 0.6645565415599884 }, { "name": "model.layers.32.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.034397428156808e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006905384361743927, "sensitivity": 0.536319254804999 }, { "name": "model.layers.32.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006973270210437477, "sensitivity": 0.5914682546704799 }, { "name": "model.layers.32.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.33702870295383e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006880580331198871, "sensitivity": 0.5122294213799852 }, { "name": "model.layers.32.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.46451226202771e-05, "sensitivity": 0.6096137852475064 }, { "name": "model.layers.32.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0226520998912747e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007687066681683064, "sensitivity": 0.5449326301095927 }, { "name": "model.layers.32.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.88187322136946e-05, "sensitivity": 1.1217431541954221 }, { "name": "model.layers.32.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.720090025031823e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006576607702299953, "sensitivity": 0.5255462002375895 }, { "name": "model.layers.32.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.061435068550054e-05, "sensitivity": 1.3791163924063794 }, { "name": "model.layers.32.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4111644759395858e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.700270412489772e-05, "sensitivity": 0.6867830933798955 }, { "name": "model.layers.32.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.149924355559051e-05, "sensitivity": 1.6517615031878943 }, { "name": "model.layers.32.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2194500413897913e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007148664444684982, "sensitivity": 0.5783521112848677 }, { "name": "model.layers.32.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.497354479506612e-05, "sensitivity": 0.8692732489609256 }, { "name": "model.layers.32.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.327180012202007e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.663645035587251e-05, "sensitivity": 0.6413145332981645 }, { "name": "model.layers.32.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.786193651147187e-05, "sensitivity": 0.9475612173446171 }, { "name": "model.layers.32.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.365259418496862e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006625970709137619, "sensitivity": 0.5255912123004578 }, { "name": "model.layers.32.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0621602996252477e-05, "sensitivity": 1.3041878290975055 }, { "name": "model.layers.32.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.459179076045984e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00066731235710904, "sensitivity": 0.5554847187382739 }, { "name": "model.layers.32.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1093470675405115e-05, "sensitivity": 1.6966364016660584 }, { "name": "model.layers.32.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.985550152829092e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006767305894754827, "sensitivity": 0.5519867812408302 }, { "name": "model.layers.32.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.912702908972278e-05, "sensitivity": 1.1945746090293157 }, { "name": "model.layers.32.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.29153884499101e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006620024796575308, "sensitivity": 0.5961163561237249 }, { "name": "model.layers.32.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.641099753323942e-05, "sensitivity": 0.7618022512305784 }, { "name": "model.layers.32.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.094386091921479e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007610111497342587, "sensitivity": 0.543890354517218 }, { "name": "model.layers.32.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0864898285944946e-05, "sensitivity": 1.3278826991831658 }, { "name": "model.layers.32.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.485449262072507e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006556726293638349, "sensitivity": 0.5221055768649021 }, { "name": "model.layers.32.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0852518244064413e-05, "sensitivity": 1.5022062002047027 }, { "name": "model.layers.32.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6679796317475848e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8271409216104075e-05, "sensitivity": 0.7848804845523457 }, { "name": "model.layers.32.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.118597957538441e-05, "sensitivity": 0.7279647885219872 }, { "name": "model.layers.32.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.100060201992164e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006762716802768409, "sensitivity": 0.5568235860719813 }, { "name": "model.layers.32.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0816091718152165e-05, "sensitivity": 1.1811710406826106 }, { "name": "model.layers.32.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.248739848364494e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006897016428411007, "sensitivity": 0.5520486158114044 }, { "name": "model.layers.32.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.088835961127188e-05, "sensitivity": 1.431903240480181 }, { "name": "model.layers.32.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.901120173097297e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.988491466268897e-05, "sensitivity": 0.6567586809324092 }, { "name": "model.layers.32.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0976272278639954e-05, "sensitivity": 1.6874613005047479 }, { "name": "model.layers.32.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.027610096571152e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.808612331748009e-05, "sensitivity": 0.6295627774539856 }, { "name": "model.layers.32.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6672259233891964e-05, "sensitivity": 1.1628600132126823 }, { "name": "model.layers.32.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.664439405947633e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7695531722856686e-05, "sensitivity": 0.6720524465342259 }, { "name": "model.layers.32.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.770161341293715e-06, "sensitivity": 1.4911669168210928 }, { "name": "model.layers.32.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.8191164953314e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5719472584314644e-05, "sensitivity": 0.6040836071643793 }, { "name": "model.layers.32.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.729196345782839e-05, "sensitivity": 0.750060990485751 }, { "name": "model.layers.32.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.850198239291785e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006503543118014932, "sensitivity": 0.568819311109846 }, { "name": "model.layers.32.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.162931094877422e-05, "sensitivity": 0.7559608344590685 }, { "name": "model.layers.32.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.729560707048222e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006857152911834419, "sensitivity": 0.5387041399548603 }, { "name": "model.layers.32.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0470132110640407e-05, "sensitivity": 1.6138631517426663 }, { "name": "model.layers.32.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0311041478416882e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006508991355076432, "sensitivity": 0.5960613613684032 }, { "name": "model.layers.32.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.801668157801032e-05, "sensitivity": 0.9609576704625854 }, { "name": "model.layers.32.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0155936251976527e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.880543903913349e-05, "sensitivity": 0.6126103347116535 }, { "name": "model.layers.32.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.923404387431219e-05, "sensitivity": 0.9117298660508 }, { "name": "model.layers.32.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.553265959359123e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006588222458958626, "sensitivity": 0.5224879816870988 }, { "name": "model.layers.32.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.300793756963685e-05, "sensitivity": 1.1258251176220837 }, { "name": "model.layers.32.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.623611963936128e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.425791070796549e-05, "sensitivity": 0.6552531582772733 }, { "name": "model.layers.32.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.612989091081545e-05, "sensitivity": 0.7769363950520056 }, { "name": "model.layers.32.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0204964837612351e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.777502130717039e-05, "sensitivity": 0.6203038813845021 }, { "name": "model.layers.32.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1042657206417061e-05, "sensitivity": 1.4944535653989512 }, { "name": "model.layers.32.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1706025588864577e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006827153265476227, "sensitivity": 0.5392869724940161 }, { "name": "model.layers.32.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.2736039682058617e-06, "sensitivity": 2.0972518681062153 }, { "name": "model.layers.32.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.123725029283378e-07, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006308412412181497, "sensitivity": 0.5320360514649368 }, { "name": "model.layers.32.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.597793253604323e-05, "sensitivity": 0.699485763742341 }, { "name": "model.layers.32.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2323173450567992e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.563225178979337e-05, "sensitivity": 0.6569452509575985 }, { "name": "model.layers.32.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 2.9369743970164564e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.440627440591925e-06, "sensitivity": 2.1015494996697015 }, { "name": "model.layers.32.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3235816140877432e-06, "sensitivity": 10.0 }, { "name": "model.layers.32.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.6230035271291854e-06, "sensitivity": 2.10147411484859 }, { "name": "model.layers.32.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 4.29903193435166e-05, "sensitivity": 1.8097854934768456 }, { "name": "model.layers.32.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00022153585450723767, "sensitivity": 1.1512106715504524 }, { "name": "model.layers.32.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.786085522326175e-05, "sensitivity": 1.5227144173150438 }, { "name": "model.layers.32.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.2333456551423296e-05, "sensitivity": 0.7690258458586214 }, { "name": "model.layers.32.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003518016601447016, "sensitivity": 0.7687551116241086 }, { "name": "model.layers.33.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0935173122561537e-05, "sensitivity": 1.357327172259768 }, { "name": "model.layers.33.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.705648729621316e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006763027049601078, "sensitivity": 0.5425801130602861 }, { "name": "model.layers.33.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4263597121462226e-05, "sensitivity": 0.7615885643962059 }, { "name": "model.layers.33.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.873074423514481e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006472980603575706, "sensitivity": 0.5780588861750796 }, { "name": "model.layers.33.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.469827349064872e-05, "sensitivity": 0.6798072314704586 }, { "name": "model.layers.33.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.03966599960404e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007459461921826005, "sensitivity": 0.5276968366631059 }, { "name": "model.layers.33.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006316097569651902, "sensitivity": 0.5349558568507965 }, { "name": "model.layers.33.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.361397026921622e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006321565015241504, "sensitivity": 0.5458833379534402 }, { "name": "model.layers.33.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.135971489129588e-05, "sensitivity": 0.7460046571106476 }, { "name": "model.layers.33.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.168358706621802e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007078958442434669, "sensitivity": 0.5368272350668164 }, { "name": "model.layers.33.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.729952681576833e-05, "sensitivity": 1.005330055097516 }, { "name": "model.layers.33.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.819968234594853e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006445999606512487, "sensitivity": 0.5786093229507147 }, { "name": "model.layers.33.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.260191003093496e-05, "sensitivity": 0.6770907701562731 }, { "name": "model.layers.33.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.043189058691496e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007033710135146976, "sensitivity": 0.5313038625979651 }, { "name": "model.layers.33.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.838399374624714e-05, "sensitivity": 0.8270816930553891 }, { "name": "model.layers.33.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6106696421047673e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006431511137634516, "sensitivity": 0.5564183440244777 }, { "name": "model.layers.33.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.270313315326348e-05, "sensitivity": 0.8369618487093129 }, { "name": "model.layers.33.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.218565656330611e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007056035101413727, "sensitivity": 0.5030787924748258 }, { "name": "model.layers.33.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.142993824032601e-05, "sensitivity": 1.2552058876098209 }, { "name": "model.layers.33.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.182852641562931e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.145790393929929e-05, "sensitivity": 0.6185768920278032 }, { "name": "model.layers.33.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007285535102710128, "sensitivity": 0.591301711522398 }, { "name": "model.layers.33.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.228709364426322e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007371436222456396, "sensitivity": 0.5288844679546147 }, { "name": "model.layers.33.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0536215086176526e-05, "sensitivity": 1.6551706290648724 }, { "name": "model.layers.33.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.28241673186858e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000636975048109889, "sensitivity": 0.5330480206998189 }, { "name": "model.layers.33.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8517864090390503e-05, "sensitivity": 0.987096900910117 }, { "name": "model.layers.33.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2603449022208224e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0065674915676937e-05, "sensitivity": 0.7208401319564457 }, { "name": "model.layers.33.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.103645137045532e-05, "sensitivity": 0.7341119995284257 }, { "name": "model.layers.33.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.435224915752769e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006838801200501621, "sensitivity": 0.5234124011691028 }, { "name": "model.layers.33.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.038291520671919e-05, "sensitivity": 1.2630671169493808 }, { "name": "model.layers.33.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3509536529454635e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5470529332524166e-05, "sensitivity": 0.6543379455242903 }, { "name": "model.layers.33.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.04270571784582e-05, "sensitivity": 0.6410350560528156 }, { "name": "model.layers.33.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.754142987119849e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006652912124991417, "sensitivity": 0.5364102600073827 }, { "name": "model.layers.33.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.664220589096658e-05, "sensitivity": 1.1753439808706065 }, { "name": "model.layers.33.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.851198802200088e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006533404812216759, "sensitivity": 0.5644819776062547 }, { "name": "model.layers.33.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.954558193683624e-05, "sensitivity": 0.9935864562441132 }, { "name": "model.layers.33.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0105986802955158e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008267539087682962, "sensitivity": 0.5231779749237354 }, { "name": "model.layers.33.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.707211676053703e-05, "sensitivity": 0.9523878565103993 }, { "name": "model.layers.33.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.620360176792019e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006609453703276813, "sensitivity": 0.5486342466791894 }, { "name": "model.layers.33.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.981654248898849e-05, "sensitivity": 1.049382744147329 }, { "name": "model.layers.33.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.144900220941054e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000694672460667789, "sensitivity": 0.5573886649541657 }, { "name": "model.layers.33.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.840116864419542e-05, "sensitivity": 0.7007606732434328 }, { "name": "model.layers.33.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.160467134781356e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006809725309722126, "sensitivity": 0.5245818136462933 }, { "name": "model.layers.33.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.472400855273008e-05, "sensitivity": 0.7222306268444341 }, { "name": "model.layers.33.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.841855899139773e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007193984347395599, "sensitivity": 0.5736848635520844 }, { "name": "model.layers.33.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.270361336646602e-05, "sensitivity": 0.7462664473709852 }, { "name": "model.layers.33.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.332689051509078e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007026779348962009, "sensitivity": 0.5964102161219762 }, { "name": "model.layers.33.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1540137165866327e-05, "sensitivity": 1.3200462056435762 }, { "name": "model.layers.33.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2862459470852627e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007162190740928054, "sensitivity": 0.5665443546093911 }, { "name": "model.layers.33.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.631584983551875e-05, "sensitivity": 0.6221435639344549 }, { "name": "model.layers.33.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.86304894973e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007309670327231288, "sensitivity": 0.5288485675752805 }, { "name": "model.layers.33.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006649877759627998, "sensitivity": 0.5531085070067545 }, { "name": "model.layers.33.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.212170203274582e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006966012879274786, "sensitivity": 0.5223196463255826 }, { "name": "model.layers.33.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.111067341407761e-05, "sensitivity": 0.6063809839654098 }, { "name": "model.layers.33.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.369437409783131e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006940590683370829, "sensitivity": 0.5454365129767295 }, { "name": "model.layers.33.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.365760110478732e-06, "sensitivity": 2.097621653795591 }, { "name": "model.layers.33.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5414528888868517e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.688913370249793e-05, "sensitivity": 0.98808022228594 }, { "name": "model.layers.33.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.781790241599083e-05, "sensitivity": 1.0281725923848852 }, { "name": "model.layers.33.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0554360869718948e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.552550283027813e-05, "sensitivity": 0.6903858039244625 }, { "name": "model.layers.33.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006442618323490024, "sensitivity": 0.5155975118527106 }, { "name": "model.layers.33.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.782804007343657e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006780314142815769, "sensitivity": 0.5487423742330373 }, { "name": "model.layers.33.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.974509258521721e-05, "sensitivity": 1.1192805685714602 }, { "name": "model.layers.33.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.075738282452221e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006774912471882999, "sensitivity": 0.5517737643408825 }, { "name": "model.layers.33.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.678359229932539e-05, "sensitivity": 0.8526137220352447 }, { "name": "model.layers.33.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.300659939981415e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.179579941090196e-05, "sensitivity": 0.6074110225524557 }, { "name": "model.layers.33.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.734213482355699e-05, "sensitivity": 1.0822690994136364 }, { "name": "model.layers.33.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.780969776329584e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006309857708401978, "sensitivity": 0.5839953304638935 }, { "name": "model.layers.33.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7126220781356096e-05, "sensitivity": 0.9532127577608518 }, { "name": "model.layers.33.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.448053906955465e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006521969335153699, "sensitivity": 0.5647707353599619 }, { "name": "model.layers.33.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0840587492566556e-05, "sensitivity": 1.3058036265875321 }, { "name": "model.layers.33.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.547608215143555e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006398960249498487, "sensitivity": 0.5323489424195229 }, { "name": "model.layers.33.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.301819666987285e-05, "sensitivity": 0.8448436419194202 }, { "name": "model.layers.33.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.448611990592326e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007058662595227361, "sensitivity": 0.5115687684135026 }, { "name": "model.layers.33.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007059999625198543, "sensitivity": 0.5855556406120271 }, { "name": "model.layers.33.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.43421594506799e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000725842546671629, "sensitivity": 0.5614629736439508 }, { "name": "model.layers.33.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.097492223489098e-05, "sensitivity": 0.7803281637406261 }, { "name": "model.layers.33.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.959256885849754e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006831944920122623, "sensitivity": 0.5540704069247394 }, { "name": "model.layers.33.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0611331163090654e-05, "sensitivity": 1.804780818972745 }, { "name": "model.layers.33.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2348932614258956e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006621351349167526, "sensitivity": 0.5911216337356009 }, { "name": "model.layers.33.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.907185186515562e-05, "sensitivity": 0.9186351825095878 }, { "name": "model.layers.33.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.340053909705603e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006756647489964962, "sensitivity": 0.5442121353797494 }, { "name": "model.layers.33.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006402754806913435, "sensitivity": 0.5889837128485109 }, { "name": "model.layers.33.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.516291589126922e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006688520079478621, "sensitivity": 0.5492975247105738 }, { "name": "model.layers.33.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8962494222214445e-05, "sensitivity": 0.9597710439923124 }, { "name": "model.layers.33.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.995133953249024e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006515582790598273, "sensitivity": 0.5345284045073841 }, { "name": "model.layers.33.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.266385753406212e-05, "sensitivity": 0.763485597459077 }, { "name": "model.layers.33.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.129837851811317e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007119818474166095, "sensitivity": 0.5480128400264495 }, { "name": "model.layers.33.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.014424070599489e-05, "sensitivity": 0.9767099472132139 }, { "name": "model.layers.33.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.73860642514046e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000660466670524329, "sensitivity": 0.5348862709773149 }, { "name": "model.layers.33.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0826212575193495e-05, "sensitivity": 0.6431945885094759 }, { "name": "model.layers.33.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.468199214599736e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000676833325996995, "sensitivity": 0.5672931860942725 }, { "name": "model.layers.33.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0782342542370316e-05, "sensitivity": 1.254290353125612 }, { "name": "model.layers.33.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4660097349405987e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006819835398346186, "sensitivity": 0.5940434178596681 }, { "name": "model.layers.33.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.503813448129222e-06, "sensitivity": 2.097163744272483 }, { "name": "model.layers.33.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1674818551909993e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007026073872111738, "sensitivity": 0.5516120981899584 }, { "name": "model.layers.33.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 3.0344267543114256e-06, "sensitivity": 2.097748487121366 }, { "name": "model.layers.33.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3900751127948752e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.117284985724837e-05, "sensitivity": 0.8326120800339636 }, { "name": "model.layers.33.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0172751899517607e-05, "sensitivity": 1.5510321080370402 }, { "name": "model.layers.33.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.529762686113827e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006110860267654061, "sensitivity": 0.527406858482833 }, { "name": "model.layers.33.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.050019874237478e-05, "sensitivity": 1.0926827090735687 }, { "name": "model.layers.33.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.249111733159225e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006709519657306373, "sensitivity": 0.5630642421704241 }, { "name": "model.layers.33.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007128085708245635, "sensitivity": 0.5714003560040491 }, { "name": "model.layers.33.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.224858791232691e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.416437099687755e-05, "sensitivity": 0.7218997861590706 }, { "name": "model.layers.33.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7248860684921965e-05, "sensitivity": 0.8204434380490525 }, { "name": "model.layers.33.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.365882422367577e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006531433900818229, "sensitivity": 0.5685186197723048 }, { "name": "model.layers.33.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.972789949737489e-05, "sensitivity": 0.65540285897746 }, { "name": "model.layers.33.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.27271264824958e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006736629875376821, "sensitivity": 0.5075015005900184 }, { "name": "model.layers.33.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1311136404401623e-05, "sensitivity": 1.3503657040868013 }, { "name": "model.layers.33.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.215009532046679e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007219213293865323, "sensitivity": 0.5971190924311695 }, { "name": "model.layers.33.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.284036498982459e-05, "sensitivity": 0.8509925800705197 }, { "name": "model.layers.33.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.554519238008652e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007166103459894657, "sensitivity": 0.5647492108672031 }, { "name": "model.layers.33.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.168246909510344e-05, "sensitivity": 1.04754971877923 }, { "name": "model.layers.33.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.519450034327747e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007020856137387455, "sensitivity": 0.5334680301849597 }, { "name": "model.layers.33.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0471141649759375e-05, "sensitivity": 1.3403094610138757 }, { "name": "model.layers.33.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0331198154744925e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000673146394547075, "sensitivity": 0.5688206150499103 }, { "name": "model.layers.33.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.295336061157286e-05, "sensitivity": 0.7989876692501868 }, { "name": "model.layers.33.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.549392648797948e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007211660849861801, "sensitivity": 0.5248376588812804 }, { "name": "model.layers.33.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007112195598892868, "sensitivity": 0.5255299531752364 }, { "name": "model.layers.33.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.623452802363317e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007234588265419006, "sensitivity": 0.5439883432967989 }, { "name": "model.layers.33.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.519117596326396e-05, "sensitivity": 1.0808462741734104 }, { "name": "model.layers.33.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.220356448873645e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.658092024736106e-05, "sensitivity": 0.6587357752690652 }, { "name": "model.layers.33.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.634475019178353e-05, "sensitivity": 0.8846579596170361 }, { "name": "model.layers.33.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.141318193731422e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006379438564181328, "sensitivity": 0.5428039654811827 }, { "name": "model.layers.33.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.922419222770259e-05, "sensitivity": 0.7394532911512341 }, { "name": "model.layers.33.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.063754310365766e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006797193782404065, "sensitivity": 0.5173129155920932 }, { "name": "model.layers.33.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.496974674519151e-05, "sensitivity": 0.782823637961614 }, { "name": "model.layers.33.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.36455831429339e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007271577487699687, "sensitivity": 0.5261445730604687 }, { "name": "model.layers.33.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.130732799647376e-05, "sensitivity": 0.7705933063296202 }, { "name": "model.layers.33.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.255551051661314e-07, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006846903706900775, "sensitivity": 0.5711103829369704 }, { "name": "model.layers.33.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 2.7226280963077443e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3698721633991227e-06, "sensitivity": 2.1016800938131195 }, { "name": "model.layers.33.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3968805205877288e-06, "sensitivity": 10.0 }, { "name": "model.layers.33.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.632758312553051e-06, "sensitivity": 2.1022399157547405 }, { "name": "model.layers.33.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 3.7790461647091433e-05, "sensitivity": 1.8815554419241358 }, { "name": "model.layers.33.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 4, "mse": 3.280419696238823e-05, "sensitivity": 1.2487906536674969 }, { "name": "model.layers.33.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.4641578673035838e-05, "sensitivity": 1.3577588312486972 }, { "name": "model.layers.33.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.6579941883683205e-05, "sensitivity": 0.7668126065899651 }, { "name": "model.layers.33.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002731051354203373, "sensitivity": 1.1042670175269305 }, { "name": "model.layers.34.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006829413468949497, "sensitivity": 0.5584614934395276 }, { "name": "model.layers.34.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.036297802187619e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006753777852281928, "sensitivity": 0.5317845838290897 }, { "name": "model.layers.34.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.931530904490501e-05, "sensitivity": 1.1392925896592292 }, { "name": "model.layers.34.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3701513807973242e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006764413556084037, "sensitivity": 0.545735626949245 }, { "name": "model.layers.34.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.071657844586298e-05, "sensitivity": 0.6819437489607418 }, { "name": "model.layers.34.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1052582067350158e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.988156044622883e-05, "sensitivity": 0.6260624585106176 }, { "name": "model.layers.34.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.067240610718727e-05, "sensitivity": 0.7864097756373085 }, { "name": "model.layers.34.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.604682418284938e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006964824860915542, "sensitivity": 0.5237862097189798 }, { "name": "model.layers.34.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.977919136057608e-05, "sensitivity": 0.8530142435768685 }, { "name": "model.layers.34.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.60322381615697e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006631655851379037, "sensitivity": 0.5290823842917889 }, { "name": "model.layers.34.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1024810191884171e-05, "sensitivity": 1.2127970807378519 }, { "name": "model.layers.34.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2118470067434828e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006850915960967541, "sensitivity": 0.5190367251247088 }, { "name": "model.layers.34.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.891914770472795e-05, "sensitivity": 0.8671300125325141 }, { "name": "model.layers.34.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.526129254780244e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.901047188672237e-05, "sensitivity": 0.8509700505018893 }, { "name": "model.layers.34.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.284750270424411e-05, "sensitivity": 0.8290409910661871 }, { "name": "model.layers.34.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1059264579671435e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.19568454567343e-05, "sensitivity": 0.6343809655935064 }, { "name": "model.layers.34.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0026875871699303e-05, "sensitivity": 1.0101304439991818 }, { "name": "model.layers.34.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3151829989510588e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006810060003772378, "sensitivity": 0.5908925222330682 }, { "name": "model.layers.34.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0775014743558131e-05, "sensitivity": 1.3392129917040134 }, { "name": "model.layers.34.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.185024285012332e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006561427726410329, "sensitivity": 0.5528459900278957 }, { "name": "model.layers.34.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.00069072050973773, "sensitivity": 0.5241925577246288 }, { "name": "model.layers.34.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.296868602679751e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006842344300821424, "sensitivity": 0.5416831498821567 }, { "name": "model.layers.34.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.979105925594922e-06, "sensitivity": 1.2752642815505681 }, { "name": "model.layers.34.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.207587501994567e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006192241562530398, "sensitivity": 0.5811035863994551 }, { "name": "model.layers.34.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.31433431408368e-05, "sensitivity": 0.8938001750860358 }, { "name": "model.layers.34.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.217317943286616e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007066546240821481, "sensitivity": 0.5497553596587273 }, { "name": "model.layers.34.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006927845533937216, "sensitivity": 0.564905878651085 }, { "name": "model.layers.34.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.293171731565963e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006844573654234409, "sensitivity": 0.504330812489783 }, { "name": "model.layers.34.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.93304609740153e-05, "sensitivity": 0.7704084064297073 }, { "name": "model.layers.34.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0487851795915049e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008010459132492542, "sensitivity": 0.546825816272745 }, { "name": "model.layers.34.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000647950975690037, "sensitivity": 0.577251538452228 }, { "name": "model.layers.34.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.16106660800142e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006558466702699661, "sensitivity": 0.5326150193714356 }, { "name": "model.layers.34.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.150404078653082e-05, "sensitivity": 0.6459202577623311 }, { "name": "model.layers.34.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.19586012110085e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006856656400486827, "sensitivity": 0.5527380379123148 }, { "name": "model.layers.34.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.131624104455113e-05, "sensitivity": 1.0503990893228878 }, { "name": "model.layers.34.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1332252825013711e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006885865586809814, "sensitivity": 0.5524749200829137 }, { "name": "model.layers.34.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1041298421332613e-05, "sensitivity": 1.3824114948100967 }, { "name": "model.layers.34.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3797606470689061e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.67719507671427e-05, "sensitivity": 0.7142121584269976 }, { "name": "model.layers.34.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.886844494147226e-05, "sensitivity": 0.6000506419619632 }, { "name": "model.layers.34.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.644236686450313e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.60132897994481e-05, "sensitivity": 0.6244844662503733 }, { "name": "model.layers.34.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.364415457937866e-05, "sensitivity": 0.6925207173937462 }, { "name": "model.layers.34.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.600044114042248e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007013862486928701, "sensitivity": 0.5107935438276927 }, { "name": "model.layers.34.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.1033962992951274e-05, "sensitivity": 0.6066415628866513 }, { "name": "model.layers.34.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.752031478958088e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000683712016325444, "sensitivity": 0.5267787186835615 }, { "name": "model.layers.34.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006350462790578604, "sensitivity": 0.575240528874233 }, { "name": "model.layers.34.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.441274985671043e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006336045917123556, "sensitivity": 0.5936785020218015 }, { "name": "model.layers.34.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6771968957036734e-05, "sensitivity": 0.7487253114328934 }, { "name": "model.layers.34.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.561093641721527e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006328242598101497, "sensitivity": 0.5666541492314147 }, { "name": "model.layers.34.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.602384382858872e-05, "sensitivity": 0.610929069134685 }, { "name": "model.layers.34.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.855623493924213e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007826555520296097, "sensitivity": 0.527796878057574 }, { "name": "model.layers.34.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.778986426070333e-05, "sensitivity": 0.8510190091623739 }, { "name": "model.layers.34.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3185208445065655e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.986632070038468e-05, "sensitivity": 0.6598650346842574 }, { "name": "model.layers.34.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.468162635224871e-05, "sensitivity": 1.0822427346188923 }, { "name": "model.layers.34.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.632360959381913e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6571687309769914e-05, "sensitivity": 0.6256662928749623 }, { "name": "model.layers.34.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.963783769402653e-05, "sensitivity": 0.9233260325537411 }, { "name": "model.layers.34.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.799241868473473e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006859648856334388, "sensitivity": 0.5199387344913411 }, { "name": "model.layers.34.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0361922250012867e-05, "sensitivity": 1.60893549266336 }, { "name": "model.layers.34.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.432395593947149e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006375653902068734, "sensitivity": 0.5634235266640369 }, { "name": "model.layers.34.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.28558118478395e-05, "sensitivity": 0.7943029761258581 }, { "name": "model.layers.34.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.904118663442205e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006989878602325916, "sensitivity": 0.5293935511423185 }, { "name": "model.layers.34.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.369658512994647e-05, "sensitivity": 0.6297341304225218 }, { "name": "model.layers.34.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2179381201349315e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007171913748607039, "sensitivity": 0.5184104410166418 }, { "name": "model.layers.34.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0843216841749381e-05, "sensitivity": 1.550677434029636 }, { "name": "model.layers.34.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.040831875798176e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006653386517427862, "sensitivity": 0.5373979560286926 }, { "name": "model.layers.34.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.592248635366559e-05, "sensitivity": 0.778073973347031 }, { "name": "model.layers.34.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.952473535828176e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8247591368854046e-05, "sensitivity": 0.6984130742245582 }, { "name": "model.layers.34.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006957526202313602, "sensitivity": 0.5882787929222644 }, { "name": "model.layers.34.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.036822123358434e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006964132189750671, "sensitivity": 0.5382874787704783 }, { "name": "model.layers.34.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.937883906881325e-05, "sensitivity": 0.9176437850053456 }, { "name": "model.layers.34.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0718180192270665e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006613642908632755, "sensitivity": 0.5835282547770085 }, { "name": "model.layers.34.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.096890865592286e-05, "sensitivity": 0.782997204661427 }, { "name": "model.layers.34.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0377909802627983e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006891537341289222, "sensitivity": 0.5104784460412247 }, { "name": "model.layers.34.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.901340045966208e-05, "sensitivity": 0.8413793374456648 }, { "name": "model.layers.34.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2117359347030288e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006597561296075583, "sensitivity": 0.5486043686396302 }, { "name": "model.layers.34.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.284756091190502e-05, "sensitivity": 0.6467190021174656 }, { "name": "model.layers.34.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.857062650553416e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007035612361505628, "sensitivity": 0.5036219669388441 }, { "name": "model.layers.34.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.496087841398548e-06, "sensitivity": 1.2802674860081225 }, { "name": "model.layers.34.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.699597522834665e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006123132188804448, "sensitivity": 0.5232833314292852 }, { "name": "model.layers.34.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1089893632743042e-05, "sensitivity": 1.2796265002009344 }, { "name": "model.layers.34.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0497179800950107e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000686654238961637, "sensitivity": 0.5175298080048208 }, { "name": "model.layers.34.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.143735663499683e-05, "sensitivity": 0.8542935839694386 }, { "name": "model.layers.34.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.401264952022757e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007025508093647659, "sensitivity": 0.555459099062038 }, { "name": "model.layers.34.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.251924060052261e-05, "sensitivity": 1.0402341691725987 }, { "name": "model.layers.34.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.413503564952407e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007016884628683329, "sensitivity": 0.5288570292381354 }, { "name": "model.layers.34.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.026324626873247e-05, "sensitivity": 0.8735249455414812 }, { "name": "model.layers.34.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.27217411622405e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006938362494111061, "sensitivity": 0.5158565179578516 }, { "name": "model.layers.34.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7695469877216965e-05, "sensitivity": 1.0396036625372957 }, { "name": "model.layers.34.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.274718442800804e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006685964181087911, "sensitivity": 0.5876797986010103 }, { "name": "model.layers.34.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.02435611654073e-05, "sensitivity": 0.8306153375511661 }, { "name": "model.layers.34.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0204926184087526e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006916669080965221, "sensitivity": 0.5484602476199112 }, { "name": "model.layers.34.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.116371514508501e-05, "sensitivity": 0.6052211373571832 }, { "name": "model.layers.34.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.544749903194315e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006974179996177554, "sensitivity": 0.5060268771486348 }, { "name": "model.layers.34.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.543830047827214e-05, "sensitivity": 0.7537996899245423 }, { "name": "model.layers.34.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0005271633417578e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.83422151976265e-05, "sensitivity": 0.6761535158931652 }, { "name": "model.layers.34.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.083389598643407e-05, "sensitivity": 0.8061945577259915 }, { "name": "model.layers.34.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3191265679779463e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9778947615996e-05, "sensitivity": 0.6580110391886917 }, { "name": "model.layers.34.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.482884055003524e-05, "sensitivity": 0.6975968733266807 }, { "name": "model.layers.34.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.411093060407438e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007357471040450037, "sensitivity": 0.5170275108354271 }, { "name": "model.layers.34.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1005911801476032e-05, "sensitivity": 1.6338625723415996 }, { "name": "model.layers.34.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.2045790046831826e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.003624730510637e-05, "sensitivity": 0.6470221227632623 }, { "name": "model.layers.34.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.732463250751607e-05, "sensitivity": 0.7072371241068811 }, { "name": "model.layers.34.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.84883354754129e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006516308058053255, "sensitivity": 0.5857838814410701 }, { "name": "model.layers.34.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1378810086171143e-05, "sensitivity": 1.3955447646577073 }, { "name": "model.layers.34.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.950948995334329e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007179055246524513, "sensitivity": 0.5331753267975146 }, { "name": "model.layers.34.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0727528762072325e-05, "sensitivity": 0.6716579573480425 }, { "name": "model.layers.34.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.124002650016337e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006778436945751309, "sensitivity": 0.5326784350305463 }, { "name": "model.layers.34.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9245125157758594e-05, "sensitivity": 0.9428875190747008 }, { "name": "model.layers.34.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.302871267711453e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006735402857884765, "sensitivity": 0.5507324959933722 }, { "name": "model.layers.34.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.507039198462735e-06, "sensitivity": 2.0970869950921247 }, { "name": "model.layers.34.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.600389153594733e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007070069550536573, "sensitivity": 0.5111261610200137 }, { "name": "model.layers.34.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0395566278020851e-05, "sensitivity": 1.525396831324092 }, { "name": "model.layers.34.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0335578508602339e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006614046869799495, "sensitivity": 0.562880169423452 }, { "name": "model.layers.34.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.503005589460372e-06, "sensitivity": 2.097424581741419 }, { "name": "model.layers.34.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.11253962131741e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006903437897562981, "sensitivity": 0.544582694739254 }, { "name": "model.layers.34.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.826074240962043e-05, "sensitivity": 1.0958068901889895 }, { "name": "model.layers.34.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0837225090654101e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007977578788995743, "sensitivity": 0.5609254854730026 }, { "name": "model.layers.34.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.053931429050863e-05, "sensitivity": 0.9898514797225189 }, { "name": "model.layers.34.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.9216890905227046e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.148965621832758e-05, "sensitivity": 0.6751209108834287 }, { "name": "model.layers.34.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0086652764584869e-05, "sensitivity": 1.233090697740095 }, { "name": "model.layers.34.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.645238386226993e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.372654413804412e-05, "sensitivity": 0.8693394098708487 }, { "name": "model.layers.34.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7833207392832264e-05, "sensitivity": 1.0866062888477162 }, { "name": "model.layers.34.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0972896689054323e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006279895314946771, "sensitivity": 0.5542885000832942 }, { "name": "model.layers.34.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007126049022190273, "sensitivity": 0.5796585863412235 }, { "name": "model.layers.34.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.835926337269484e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007001174381002784, "sensitivity": 0.5115820567486947 }, { "name": "model.layers.34.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9799273003591225e-05, "sensitivity": 0.6901166560536101 }, { "name": "model.layers.34.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.846975679764e-07, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006782313575968146, "sensitivity": 0.5321935561105177 }, { "name": "model.layers.34.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1877155884576496e-05, "sensitivity": 1.4720899075842069 }, { "name": "model.layers.34.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2622472240764182e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.538846355397254e-05, "sensitivity": 0.6948403282946294 }, { "name": "model.layers.34.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 2.4884384401957504e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.1798055058752652e-06, "sensitivity": 2.101165805651614 }, { "name": "model.layers.34.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8697804762268788e-06, "sensitivity": 10.0 }, { "name": "model.layers.34.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.5563781516902964e-06, "sensitivity": 2.1016828044447946 }, { "name": "model.layers.34.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 7.99723966338206e-06, "sensitivity": 2.2026844665975402 }, { "name": "model.layers.34.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00018199138867203146, "sensitivity": 0.9569487031581467 }, { "name": "model.layers.34.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.568809057062026e-05, "sensitivity": 1.4101238499095523 }, { "name": "model.layers.34.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.361348303267732e-05, "sensitivity": 0.709301810261124 }, { "name": "model.layers.34.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00029668156639672816, "sensitivity": 0.811892795330873 }, { "name": "model.layers.35.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.70618431083858e-05, "sensitivity": 1.0991253008030595 }, { "name": "model.layers.35.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1424307331253658e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006386045715771616, "sensitivity": 0.5335525931637266 }, { "name": "model.layers.35.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4359941714210436e-05, "sensitivity": 0.8840672425538806 }, { "name": "model.layers.35.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0359588031860767e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006100083119235933, "sensitivity": 0.5816245967245918 }, { "name": "model.layers.35.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0829574421222787e-05, "sensitivity": 1.3377334911122236 }, { "name": "model.layers.35.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5389603049698053e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.451339868362993e-05, "sensitivity": 0.6412481509987683 }, { "name": "model.layers.35.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.868312291568145e-05, "sensitivity": 1.0711933971764047 }, { "name": "model.layers.35.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.097270569516695e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006542782066389918, "sensitivity": 0.5487574227791796 }, { "name": "model.layers.35.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0156160897167865e-05, "sensitivity": 1.944065664453109 }, { "name": "model.layers.35.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.069057134372997e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.492334457812831e-05, "sensitivity": 0.7091742828328679 }, { "name": "model.layers.35.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.635496199829504e-05, "sensitivity": 0.8790567488155168 }, { "name": "model.layers.35.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1596533795454889e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006356982048600912, "sensitivity": 0.5505319843789369 }, { "name": "model.layers.35.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.678994395770133e-05, "sensitivity": 0.8683572425077949 }, { "name": "model.layers.35.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.068061217476497e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007849936373531818, "sensitivity": 0.5479522504023678 }, { "name": "model.layers.35.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.894468631595373e-05, "sensitivity": 0.7061949481807932 }, { "name": "model.layers.35.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.598537419857166e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006555598229169846, "sensitivity": 0.5196422105844097 }, { "name": "model.layers.35.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.440957804443315e-05, "sensitivity": 0.602746469228769 }, { "name": "model.layers.35.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.06949037976301e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007105536642484367, "sensitivity": 0.5385789417733174 }, { "name": "model.layers.35.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.474636029452085e-05, "sensitivity": 0.6050056071796563 }, { "name": "model.layers.35.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0398114227427868e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007124672411009669, "sensitivity": 0.5616764199483478 }, { "name": "model.layers.35.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.436184048652649e-05, "sensitivity": 0.861222477643339 }, { "name": "model.layers.35.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.071090537152486e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007195805665105581, "sensitivity": 0.5600039351904381 }, { "name": "model.layers.35.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.481646803673357e-05, "sensitivity": 0.7983123723549397 }, { "name": "model.layers.35.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2376494851196185e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006257315981201828, "sensitivity": 0.530401052892314 }, { "name": "model.layers.35.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0451653906784486e-05, "sensitivity": 1.218425074334331 }, { "name": "model.layers.35.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1715186474248185e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006462531164288521, "sensitivity": 0.5713204137268588 }, { "name": "model.layers.35.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.950669219600968e-05, "sensitivity": 0.6306298324093531 }, { "name": "model.layers.35.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.013080350276141e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006570501136593521, "sensitivity": 0.550030243653942 }, { "name": "model.layers.35.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0770933487219736e-05, "sensitivity": 0.6674083867765931 }, { "name": "model.layers.35.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.434892263016081e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000672280672006309, "sensitivity": 0.5418020566923357 }, { "name": "model.layers.35.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.994080856908113e-05, "sensitivity": 1.047286928775542 }, { "name": "model.layers.35.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1148380281156278e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006776444497518241, "sensitivity": 0.5382571641010755 }, { "name": "model.layers.35.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.070172856998397e-05, "sensitivity": 1.3469971518328334 }, { "name": "model.layers.35.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5214599216051283e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.882512414245866e-05, "sensitivity": 0.6422535228900591 }, { "name": "model.layers.35.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.795253673568368e-05, "sensitivity": 1.0409013292882752 }, { "name": "model.layers.35.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.068821120497887e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006542092887684703, "sensitivity": 0.5527116395836542 }, { "name": "model.layers.35.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0685384040698409e-05, "sensitivity": 1.541086537671292 }, { "name": "model.layers.35.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1337342584738508e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006532776169478893, "sensitivity": 0.5287220877439335 }, { "name": "model.layers.35.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0540707080508582e-05, "sensitivity": 1.6423746393701064 }, { "name": "model.layers.35.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.9834277484042104e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7545898016542196e-05, "sensitivity": 0.6551774347662053 }, { "name": "model.layers.35.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.01495812588837e-05, "sensitivity": 0.6493685725324408 }, { "name": "model.layers.35.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.29532496027241e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006920799496583641, "sensitivity": 0.5297903047925777 }, { "name": "model.layers.35.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0517060218262486e-05, "sensitivity": 1.3534203996318983 }, { "name": "model.layers.35.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.757563136896351e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006607254035770893, "sensitivity": 0.5512299377451171 }, { "name": "model.layers.35.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.256594158709049e-05, "sensitivity": 0.9339139943157201 }, { "name": "model.layers.35.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1900618801519158e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006116607692092657, "sensitivity": 0.5719359603830647 }, { "name": "model.layers.35.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.167267565615475e-05, "sensitivity": 0.7199065603192373 }, { "name": "model.layers.35.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.500907935944269e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006775010260753334, "sensitivity": 0.5813643743095401 }, { "name": "model.layers.35.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.080047387513332e-05, "sensitivity": 0.7637973135896469 }, { "name": "model.layers.35.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.265744213531434e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.058024519006722e-05, "sensitivity": 0.6153857307836802 }, { "name": "model.layers.35.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.278574437601492e-05, "sensitivity": 0.6374147595922813 }, { "name": "model.layers.35.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.560322501376504e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007133637554943562, "sensitivity": 0.5178222037043779 }, { "name": "model.layers.35.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007357698632404208, "sensitivity": 0.5652300718162229 }, { "name": "model.layers.35.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.701396948003094e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000732538930606097, "sensitivity": 0.521019440753647 }, { "name": "model.layers.35.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.811664595967159e-05, "sensitivity": 0.6763219496161457 }, { "name": "model.layers.35.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.730846280333935e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006698654033243656, "sensitivity": 0.5487278900108788 }, { "name": "model.layers.35.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.744825805071741e-05, "sensitivity": 0.786950600459317 }, { "name": "model.layers.35.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.886682619253406e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007577185751870275, "sensitivity": 0.5713144812745226 }, { "name": "model.layers.35.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.628553092014045e-05, "sensitivity": 0.7999795141096475 }, { "name": "model.layers.35.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.173339551831305e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.799225229769945e-05, "sensitivity": 0.6469353221347525 }, { "name": "model.layers.35.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006954201962798834, "sensitivity": 0.5873240417849551 }, { "name": "model.layers.35.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.347252335421217e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006952495314180851, "sensitivity": 0.5333934741700551 }, { "name": "model.layers.35.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.079291779315099e-05, "sensitivity": 0.8435514046241619 }, { "name": "model.layers.35.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4017900866747368e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.199085328262299e-05, "sensitivity": 0.6096661507292274 }, { "name": "model.layers.35.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006357368547469378, "sensitivity": 0.5638659784620561 }, { "name": "model.layers.35.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.581135944041307e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006415140233002603, "sensitivity": 0.546470574242871 }, { "name": "model.layers.35.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.115852046496002e-05, "sensitivity": 1.593687941152419 }, { "name": "model.layers.35.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.358795978187118e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.550576654262841e-05, "sensitivity": 0.9503877544323037 }, { "name": "model.layers.35.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.737843796145171e-05, "sensitivity": 0.7973802162586449 }, { "name": "model.layers.35.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1129008044008515e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007645506411790848, "sensitivity": 0.5672743738707933 }, { "name": "model.layers.35.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006870562210679054, "sensitivity": 0.5995171994737869 }, { "name": "model.layers.35.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1993320185865741e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006713428301736712, "sensitivity": 0.5391335303472728 }, { "name": "model.layers.35.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0993821888405364e-05, "sensitivity": 1.248577801088478 }, { "name": "model.layers.35.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2028760920657078e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006559576722793281, "sensitivity": 0.522490785380921 }, { "name": "model.layers.35.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7463264965917915e-05, "sensitivity": 1.1033267873658048 }, { "name": "model.layers.35.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.711975402140524e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006373663782142103, "sensitivity": 0.5328036127902328 }, { "name": "model.layers.35.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.092158946557902e-05, "sensitivity": 0.9498970113979277 }, { "name": "model.layers.35.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.215615932589571e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006796100060455501, "sensitivity": 0.5187139857414349 }, { "name": "model.layers.35.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.920112016610801e-05, "sensitivity": 0.7984818434758493 }, { "name": "model.layers.35.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0632263638399309e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006603614310733974, "sensitivity": 0.5231039432909949 }, { "name": "model.layers.35.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.2101764595136046e-05, "sensitivity": 0.609707986402257 }, { "name": "model.layers.35.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.286053348958376e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006028921343386173, "sensitivity": 0.5311876161612147 }, { "name": "model.layers.35.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9473150031408295e-05, "sensitivity": 0.7451729020679763 }, { "name": "model.layers.35.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.954061859687499e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006660178187303245, "sensitivity": 0.5171516642606113 }, { "name": "model.layers.35.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6319666327908635e-05, "sensitivity": 0.6794653749016638 }, { "name": "model.layers.35.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.898816415443434e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006338850362226367, "sensitivity": 0.5591249339564277 }, { "name": "model.layers.35.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.989064811728895e-05, "sensitivity": 0.6609322029408489 }, { "name": "model.layers.35.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.792647582187783e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006737876683473587, "sensitivity": 0.5442244715459172 }, { "name": "model.layers.35.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.060202187858522e-05, "sensitivity": 0.7114875667037105 }, { "name": "model.layers.35.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2097585795345367e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.235466910060495e-05, "sensitivity": 0.7725651026311318 }, { "name": "model.layers.35.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.106073124101385e-05, "sensitivity": 0.7129473992420127 }, { "name": "model.layers.35.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.105666115108761e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006691885646432638, "sensitivity": 0.5393813650654562 }, { "name": "model.layers.35.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.81150850141421e-05, "sensitivity": 1.091510395383787 }, { "name": "model.layers.35.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.375045806336857e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.577950600534678e-05, "sensitivity": 1.006115737219582 }, { "name": "model.layers.35.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.427732685348019e-05, "sensitivity": 0.8332704385087744 }, { "name": "model.layers.35.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4448098681896226e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006172447465360165, "sensitivity": 0.5940239237940906 }, { "name": "model.layers.35.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.778052582172677e-05, "sensitivity": 1.1529155944414513 }, { "name": "model.layers.35.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8832631667464739e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006367457681335509, "sensitivity": 0.5852755029192445 }, { "name": "model.layers.35.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.5821725557761965e-06, "sensitivity": 2.097214945003743 }, { "name": "model.layers.35.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5941762967486284e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.359293911373243e-05, "sensitivity": 0.6555078010627673 }, { "name": "model.layers.35.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1505731890792958e-05, "sensitivity": 1.4939884584062102 }, { "name": "model.layers.35.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1689753591781482e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007119998335838318, "sensitivity": 0.5232148382310686 }, { "name": "model.layers.35.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0470320022432134e-05, "sensitivity": 1.00372107165827 }, { "name": "model.layers.35.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0677903219402651e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006696053314954042, "sensitivity": 0.5542800849817628 }, { "name": "model.layers.35.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5009899369906634e-05, "sensitivity": 0.709856922108981 }, { "name": "model.layers.35.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1569867410798906e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006622436339966953, "sensitivity": 0.5406980022220088 }, { "name": "model.layers.35.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006992264534346759, "sensitivity": 0.5841641530823175 }, { "name": "model.layers.35.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.081315516188624e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007071515428833663, "sensitivity": 0.5464882386945282 }, { "name": "model.layers.35.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.757948383688927e-05, "sensitivity": 0.8471379264065128 }, { "name": "model.layers.35.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.804370968893636e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000639239908196032, "sensitivity": 0.5511641448197959 }, { "name": "model.layers.35.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.130263606493827e-06, "sensitivity": 1.5889336382791874 }, { "name": "model.layers.35.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.57017766975332e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005977295222692192, "sensitivity": 0.578765967948971 }, { "name": "model.layers.35.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.64440914685838e-06, "sensitivity": 1.2212980736134367 }, { "name": "model.layers.35.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2424046644810005e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000597527134232223, "sensitivity": 0.5537179257818203 }, { "name": "model.layers.35.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.43511523574125e-05, "sensitivity": 0.8725337699400386 }, { "name": "model.layers.35.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.002697882147913e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006069475784897804, "sensitivity": 0.5498525465366291 }, { "name": "model.layers.35.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.014588143443689e-05, "sensitivity": 0.9962118748055571 }, { "name": "model.layers.35.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.216074906551512e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000675952760502696, "sensitivity": 0.5605988405876947 }, { "name": "model.layers.35.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0991370800184086e-05, "sensitivity": 1.7862676007467462 }, { "name": "model.layers.35.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.412592951055558e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006926755886524916, "sensitivity": 0.5804275417077893 }, { "name": "model.layers.35.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.919995601288974e-05, "sensitivity": 0.7234696589600151 }, { "name": "model.layers.35.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0597540267553995e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006775592337362468, "sensitivity": 0.5422542011982986 }, { "name": "model.layers.35.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.92062933719717e-05, "sensitivity": 1.1838927008434639 }, { "name": "model.layers.35.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.426816637234879e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006750643951818347, "sensitivity": 0.5496560364198025 }, { "name": "model.layers.35.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.046970884199254e-05, "sensitivity": 0.7322930448950298 }, { "name": "model.layers.35.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.348525059569511e-07, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007005219231359661, "sensitivity": 0.5624076877850529 }, { "name": "model.layers.35.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0574261068541091e-05, "sensitivity": 1.8026474699237967 }, { "name": "model.layers.35.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2840240515288315e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006399333942681551, "sensitivity": 0.5528825490988984 }, { "name": "model.layers.35.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 2.235860392829636e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.5634903977334034e-06, "sensitivity": 2.101996102787218 }, { "name": "model.layers.35.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.257424966956023e-06, "sensitivity": 10.0 }, { "name": "model.layers.35.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.5992445696610957e-06, "sensitivity": 2.1027581388642904 }, { "name": "model.layers.35.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 7.800614184816368e-06, "sensitivity": 2.1505106287123117 }, { "name": "model.layers.35.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00016956492618191987, "sensitivity": 0.9010917258888543 }, { "name": "model.layers.35.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.604637691343669e-05, "sensitivity": 1.6096531391260205 }, { "name": "model.layers.35.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 4.943474050378427e-05, "sensitivity": 0.7476913648792373 }, { "name": "model.layers.35.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00029013227322138846, "sensitivity": 0.7264488893333413 }, { "name": "model.layers.36.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.668676385539584e-05, "sensitivity": 0.9640336223432616 }, { "name": "model.layers.36.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3135334029357182e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.690589750884101e-05, "sensitivity": 0.7129996317690679 }, { "name": "model.layers.36.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.962895738775842e-05, "sensitivity": 0.8959729241275801 }, { "name": "model.layers.36.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1550600902410224e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006544087082147598, "sensitivity": 0.5465737048542805 }, { "name": "model.layers.36.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006941991741769016, "sensitivity": 0.5618890343884857 }, { "name": "model.layers.36.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.016852593238582e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007054070010781288, "sensitivity": 0.5440575995655275 }, { "name": "model.layers.36.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.849979061167687e-05, "sensitivity": 0.6721901546598549 }, { "name": "model.layers.36.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.203219881062978e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006776090594939888, "sensitivity": 0.564015622377662 }, { "name": "model.layers.36.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8748228184413165e-05, "sensitivity": 1.0874910130291084 }, { "name": "model.layers.36.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.7718875824357383e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006823347648605704, "sensitivity": 0.544625672887157 }, { "name": "model.layers.36.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.026951450621709e-05, "sensitivity": 0.8288769534324171 }, { "name": "model.layers.36.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.351092676799453e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006891156081110239, "sensitivity": 0.5348018241494691 }, { "name": "model.layers.36.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7759840274229646e-05, "sensitivity": 0.9884530292175214 }, { "name": "model.layers.36.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.165736193797784e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006851445650681853, "sensitivity": 0.5253703778888019 }, { "name": "model.layers.36.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0736946933320723e-05, "sensitivity": 1.329990892548208 }, { "name": "model.layers.36.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.962535634447704e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0854043113067746e-05, "sensitivity": 0.7292771622348906 }, { "name": "model.layers.36.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.918125680182129e-05, "sensitivity": 0.6897980767829062 }, { "name": "model.layers.36.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.246757031178277e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006582018686458468, "sensitivity": 0.546522356038087 }, { "name": "model.layers.36.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.670665268553421e-05, "sensitivity": 0.9675545780015022 }, { "name": "model.layers.36.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2413274816935882e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006358489627018571, "sensitivity": 0.5848587078668935 }, { "name": "model.layers.36.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0209178071818314e-05, "sensitivity": 1.238094149590065 }, { "name": "model.layers.36.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1642566732916748e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000635845004580915, "sensitivity": 0.5495772422687493 }, { "name": "model.layers.36.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.959994450677186e-05, "sensitivity": 0.715650550204975 }, { "name": "model.layers.36.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.02360388609668e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00067283830139786, "sensitivity": 0.5289990068362125 }, { "name": "model.layers.36.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3157599571277387e-06, "sensitivity": 2.0977221956395917 }, { "name": "model.layers.36.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.58927423399291e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.119477620813996e-05, "sensitivity": 0.6975604884095079 }, { "name": "model.layers.36.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.425456841592677e-06, "sensitivity": 2.098046124713189 }, { "name": "model.layers.36.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.518637304798176e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.202734948601574e-05, "sensitivity": 1.0308489715978004 }, { "name": "model.layers.36.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.852523463545367e-05, "sensitivity": 0.6419502694478354 }, { "name": "model.layers.36.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.341172719548922e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.827449422213249e-05, "sensitivity": 0.6040139246663586 }, { "name": "model.layers.36.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.639532901113853e-05, "sensitivity": 0.8996637134516249 }, { "name": "model.layers.36.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.865009254397592e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000627523404546082, "sensitivity": 0.5349962787419901 }, { "name": "model.layers.36.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.475596455857158e-05, "sensitivity": 0.9650248734060936 }, { "name": "model.layers.36.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0230453426629538e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000726040918380022, "sensitivity": 0.553827823526564 }, { "name": "model.layers.36.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.831756425322965e-05, "sensitivity": 0.821269856299335 }, { "name": "model.layers.36.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.615073738837964e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006716576172038913, "sensitivity": 0.5575229932450995 }, { "name": "model.layers.36.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0641556046903133e-05, "sensitivity": 0.7426177871863742 }, { "name": "model.layers.36.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0089460147355567e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.070926247048192e-05, "sensitivity": 0.607932400049435 }, { "name": "model.layers.36.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.181591743370518e-05, "sensitivity": 0.6420813982500548 }, { "name": "model.layers.36.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.0139344643394e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006894014659337699, "sensitivity": 0.5490337195876179 }, { "name": "model.layers.36.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0088554164394736e-05, "sensitivity": 0.6568147679207645 }, { "name": "model.layers.36.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.732601605108357e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.029329597367905e-05, "sensitivity": 0.6667319890844 }, { "name": "model.layers.36.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9565492847468704e-05, "sensitivity": 0.8450725999895237 }, { "name": "model.layers.36.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0169870847676066e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006585392984561622, "sensitivity": 0.5177990920734435 }, { "name": "model.layers.36.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.181406206451356e-05, "sensitivity": 0.8731819401306434 }, { "name": "model.layers.36.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.963933737504703e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007003047503530979, "sensitivity": 0.5343592213490982 }, { "name": "model.layers.36.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0459551958774682e-05, "sensitivity": 1.5242070768531772 }, { "name": "model.layers.36.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.995243211349589e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00061449920758605, "sensitivity": 0.5245936523537305 }, { "name": "model.layers.36.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.13287920714356e-05, "sensitivity": 1.0279960410641238 }, { "name": "model.layers.36.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.655916078874725e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006759327370673418, "sensitivity": 0.5324166055247583 }, { "name": "model.layers.36.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.54269169899635e-05, "sensitivity": 1.0468958389347323 }, { "name": "model.layers.36.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.017398517433321e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.700131052639335e-05, "sensitivity": 0.6666338358701549 }, { "name": "model.layers.36.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.908314389875159e-05, "sensitivity": 0.7435513493970665 }, { "name": "model.layers.36.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0590541705823853e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008159849676303566, "sensitivity": 0.539085835417511 }, { "name": "model.layers.36.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.720780973206274e-05, "sensitivity": 1.0398102006294323 }, { "name": "model.layers.36.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.132068731152685e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000634964439086616, "sensitivity": 0.5351771075419581 }, { "name": "model.layers.36.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000734447268769145, "sensitivity": 0.5902420603966676 }, { "name": "model.layers.36.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0472106168890605e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007385943899862468, "sensitivity": 0.528432508377599 }, { "name": "model.layers.36.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.369512993842363e-05, "sensitivity": 0.626051071577809 }, { "name": "model.layers.36.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.513865855595213e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006978057208471, "sensitivity": 0.5704271474252549 }, { "name": "model.layers.36.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.803361535887234e-06, "sensitivity": 1.810844067356358 }, { "name": "model.layers.36.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.111821555052302e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.2466290071606636e-05, "sensitivity": 0.7193675559089636 }, { "name": "model.layers.36.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.411189679056406e-05, "sensitivity": 1.1392373513882688 }, { "name": "model.layers.36.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.5912794272881e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007239388069137931, "sensitivity": 0.5337674047045035 }, { "name": "model.layers.36.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0678957551135682e-05, "sensitivity": 1.3845916073080906 }, { "name": "model.layers.36.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5112116216187133e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.807169509353116e-05, "sensitivity": 0.7384261230559778 }, { "name": "model.layers.36.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.096934885135852e-05, "sensitivity": 1.0661468892079558 }, { "name": "model.layers.36.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.601612873666454e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006818177062086761, "sensitivity": 0.5427217163177741 }, { "name": "model.layers.36.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0651125194272026e-05, "sensitivity": 1.4551886075307705 }, { "name": "model.layers.36.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.071320050679788e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006480823503807187, "sensitivity": 0.5387879346049439 }, { "name": "model.layers.36.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.775857425760478e-05, "sensitivity": 0.7334879943850212 }, { "name": "model.layers.36.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.22509912015812e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006380357663147151, "sensitivity": 0.5504078107132487 }, { "name": "model.layers.36.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.683056588168256e-05, "sensitivity": 0.7460235653442535 }, { "name": "model.layers.36.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.55738733207545e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006753659690730274, "sensitivity": 0.5410181399277114 }, { "name": "model.layers.36.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.459267024183646e-05, "sensitivity": 0.9157599125110993 }, { "name": "model.layers.36.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1399504273867933e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.43450184725225e-05, "sensitivity": 0.6242180440735996 }, { "name": "model.layers.36.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.50553340872284e-05, "sensitivity": 1.0206746389930885 }, { "name": "model.layers.36.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.125227057258599e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.3447511163540184e-05, "sensitivity": 0.6103149591029337 }, { "name": "model.layers.36.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0206290072528645e-05, "sensitivity": 0.811226410788321 }, { "name": "model.layers.36.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2025005844407133e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000680436089169234, "sensitivity": 0.5776488091202794 }, { "name": "model.layers.36.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5866890761535615e-05, "sensitivity": 0.7218844687080449 }, { "name": "model.layers.36.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.696295369896688e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000628418056294322, "sensitivity": 0.5626676524104116 }, { "name": "model.layers.36.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.356934318318963e-05, "sensitivity": 0.7412858081147318 }, { "name": "model.layers.36.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.549958240815613e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007178589585237205, "sensitivity": 0.5294890766676 }, { "name": "model.layers.36.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.221088859892916e-05, "sensitivity": 1.2375017165583162 }, { "name": "model.layers.36.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.71440988703398e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.570393063360825e-05, "sensitivity": 0.6789214208743111 }, { "name": "model.layers.36.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.945716839050874e-05, "sensitivity": 1.1024347223527429 }, { "name": "model.layers.36.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4030504189577186e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000662908423691988, "sensitivity": 0.5536401622840835 }, { "name": "model.layers.36.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.374837094976101e-06, "sensitivity": 2.0972730538820117 }, { "name": "model.layers.36.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.471066277910722e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006757731316611171, "sensitivity": 0.522009612229682 }, { "name": "model.layers.36.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4934679458965547e-06, "sensitivity": 2.098493137667436 }, { "name": "model.layers.36.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.3165548554970883e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.786112160421908e-05, "sensitivity": 1.067276960746323 }, { "name": "model.layers.36.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.23839077888988e-05, "sensitivity": 0.9489770706543199 }, { "name": "model.layers.36.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0761461908259662e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006839242996647954, "sensitivity": 0.5227470200263583 }, { "name": "model.layers.36.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.492462125606835e-05, "sensitivity": 0.7503371383309553 }, { "name": "model.layers.36.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.84104417511844e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007500160718336701, "sensitivity": 0.549507135386226 }, { "name": "model.layers.36.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.710976984119043e-05, "sensitivity": 1.0560574061590093 }, { "name": "model.layers.36.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.499116231381777e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9287453041179106e-05, "sensitivity": 0.7072378614230035 }, { "name": "model.layers.36.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.125147774582729e-05, "sensitivity": 1.0084038640783672 }, { "name": "model.layers.36.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.283530862878251e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006767324521206319, "sensitivity": 0.5314523208526389 }, { "name": "model.layers.36.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1257325240876526e-05, "sensitivity": 1.4118462914245062 }, { "name": "model.layers.36.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.0129555196035653e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.947204044787213e-05, "sensitivity": 0.6886529744873622 }, { "name": "model.layers.36.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006696636555716395, "sensitivity": 0.5494978121908493 }, { "name": "model.layers.36.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.125281283355434e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006698934594169259, "sensitivity": 0.5287469887521085 }, { "name": "model.layers.36.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.618872430408373e-05, "sensitivity": 0.6343835776202407 }, { "name": "model.layers.36.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.09311438590521e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007409563986584544, "sensitivity": 0.5355365947366015 }, { "name": "model.layers.36.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0988539543177467e-05, "sensitivity": 1.3624498787018338 }, { "name": "model.layers.36.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.250993571185973e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006748826126568019, "sensitivity": 0.5709995572723836 }, { "name": "model.layers.36.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0569000197574496e-05, "sensitivity": 0.8508277163514519 }, { "name": "model.layers.36.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0993385330948513e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006830545607954264, "sensitivity": 0.5903178761733927 }, { "name": "model.layers.36.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0384026609244756e-05, "sensitivity": 1.5259491511843795 }, { "name": "model.layers.36.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5623470517311944e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.532040086109191e-05, "sensitivity": 0.8592470903008779 }, { "name": "model.layers.36.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.882831464987248e-05, "sensitivity": 0.6484972197899835 }, { "name": "model.layers.36.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.028889849105326e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006585276569239795, "sensitivity": 0.5733988919231214 }, { "name": "model.layers.36.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.064047228283016e-05, "sensitivity": 1.365259427216087 }, { "name": "model.layers.36.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1592276223382214e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000634188880212605, "sensitivity": 0.5953594298887261 }, { "name": "model.layers.36.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0877275245729834e-05, "sensitivity": 0.6177985793417997 }, { "name": "model.layers.36.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.299274216165941e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006708285072818398, "sensitivity": 0.5507102626573779 }, { "name": "model.layers.36.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2071599485352635e-05, "sensitivity": 1.3048750746124196 }, { "name": "model.layers.36.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.107966434385162e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007701545837335289, "sensitivity": 0.5619328214493994 }, { "name": "model.layers.36.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006736309151165187, "sensitivity": 0.5324677635138738 }, { "name": "model.layers.36.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.850726776974625e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006757138180546463, "sensitivity": 0.5409467330757185 }, { "name": "model.layers.36.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.189431587699801e-05, "sensitivity": 0.6587449613320135 }, { "name": "model.layers.36.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.022585820464883e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.212417792994529e-05, "sensitivity": 0.6263193559924018 }, { "name": "model.layers.36.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.482443505869014e-06, "sensitivity": 2.097130491516435 }, { "name": "model.layers.36.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.619687943995814e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.59232828184031e-05, "sensitivity": 0.6256681584751344 }, { "name": "model.layers.36.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.188780389493331e-05, "sensitivity": 1.086995745504538 }, { "name": "model.layers.36.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.80552852575056e-07, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.165164813864976e-05, "sensitivity": 0.632624958399351 }, { "name": "model.layers.36.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 2.135871454811422e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4085597942757886e-06, "sensitivity": 2.1033973578890737 }, { "name": "model.layers.36.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.9327427455427824e-06, "sensitivity": 10.0 }, { "name": "model.layers.36.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.6801866422611056e-06, "sensitivity": 2.1046438990440186 }, { "name": "model.layers.36.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 7.549389010819141e-06, "sensitivity": 2.1944605072919825 }, { "name": "model.layers.36.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00019526755204424262, "sensitivity": 1.1307676719923343 }, { "name": "model.layers.36.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.7418473362340592e-05, "sensitivity": 1.452552042528164 }, { "name": "model.layers.36.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.0748029025271535e-05, "sensitivity": 0.7665377373187339 }, { "name": "model.layers.36.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003096478758379817, "sensitivity": 0.8873160293952393 }, { "name": "model.layers.37.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.302124812558759e-06, "sensitivity": 2.097452335337531 }, { "name": "model.layers.37.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.12417433228984e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.896820221096277e-05, "sensitivity": 0.7921372023782499 }, { "name": "model.layers.37.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.389175541698933e-05, "sensitivity": 0.7219127596064867 }, { "name": "model.layers.37.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.35949344693654e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000741355586796999, "sensitivity": 0.5568070985848861 }, { "name": "model.layers.37.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.5106193030951545e-05, "sensitivity": 0.6633723418220443 }, { "name": "model.layers.37.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.204024884937098e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006339214160107076, "sensitivity": 0.516335529400299 }, { "name": "model.layers.37.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7829216530080885e-05, "sensitivity": 0.7582129297948588 }, { "name": "model.layers.37.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.567717830170295e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006413698429241776, "sensitivity": 0.5507321083913294 }, { "name": "model.layers.37.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1128735422971658e-05, "sensitivity": 1.3700616603755014 }, { "name": "model.layers.37.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.747691365191713e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006818644469603896, "sensitivity": 0.5721479142177051 }, { "name": "model.layers.37.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6381861213594675e-05, "sensitivity": 0.9598977763178773 }, { "name": "model.layers.37.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.754584198162775e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006472060922533274, "sensitivity": 0.563560743996091 }, { "name": "model.layers.37.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.802956729894504e-05, "sensitivity": 1.0552206108301607 }, { "name": "model.layers.37.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.484796131189796e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00063495640642941, "sensitivity": 0.5410345943772726 }, { "name": "model.layers.37.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7586126786191016e-05, "sensitivity": 0.8605155551875342 }, { "name": "model.layers.37.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.273434216083842e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.792734009446576e-05, "sensitivity": 0.6996222121259377 }, { "name": "model.layers.37.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2730108210234903e-05, "sensitivity": 1.264005302479709 }, { "name": "model.layers.37.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.041020141201443e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.654509681742638e-05, "sensitivity": 0.6666476808593517 }, { "name": "model.layers.37.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.025940820109099e-05, "sensitivity": 0.8626932921153915 }, { "name": "model.layers.37.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6035735370678594e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000711114495061338, "sensitivity": 0.5661815076716703 }, { "name": "model.layers.37.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3642824089620262e-06, "sensitivity": 2.0969615171880633 }, { "name": "model.layers.37.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.295581455451611e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006611902499571443, "sensitivity": 0.556768246469093 }, { "name": "model.layers.37.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.765238165622577e-05, "sensitivity": 0.6246352613889069 }, { "name": "model.layers.37.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.054606498968496e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006551609258167446, "sensitivity": 0.5439375638551006 }, { "name": "model.layers.37.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.094669151934795e-05, "sensitivity": 0.711999524484687 }, { "name": "model.layers.37.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.837141993149999e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006958224694244564, "sensitivity": 0.5570416800500859 }, { "name": "model.layers.37.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0699570894939825e-05, "sensitivity": 0.6824221586210265 }, { "name": "model.layers.37.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.990987225843128e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006769397296011448, "sensitivity": 0.5212081206000486 }, { "name": "model.layers.37.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.514830602100119e-05, "sensitivity": 0.6681365923450557 }, { "name": "model.layers.37.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.239202091113839e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000745285942684859, "sensitivity": 0.5445901282577901 }, { "name": "model.layers.37.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.27272334996087e-06, "sensitivity": 2.097196701441726 }, { "name": "model.layers.37.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.004353730939329e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.562891601584852e-05, "sensitivity": 0.6393174769851493 }, { "name": "model.layers.37.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.53853639960289e-05, "sensitivity": 0.7655649439565182 }, { "name": "model.layers.37.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.460768524149898e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007522036321461201, "sensitivity": 0.5305305803390639 }, { "name": "model.layers.37.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1116399946331512e-05, "sensitivity": 1.6397068868878408 }, { "name": "model.layers.37.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.749327318786527e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006732783513143659, "sensitivity": 0.5478337486025588 }, { "name": "model.layers.37.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4753678644628963e-06, "sensitivity": 2.0711763870655178 }, { "name": "model.layers.37.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0159860721614677e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000689714855980128, "sensitivity": 0.5221909400195582 }, { "name": "model.layers.37.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1366965736669954e-05, "sensitivity": 1.9609869586206166 }, { "name": "model.layers.37.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.865016995201586e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.302844849415123e-05, "sensitivity": 0.6168575310847293 }, { "name": "model.layers.37.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.230920553207397e-05, "sensitivity": 0.8498473773808541 }, { "name": "model.layers.37.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.943162927404046e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006923649925738573, "sensitivity": 0.5405471095811589 }, { "name": "model.layers.37.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006958985468372703, "sensitivity": 0.5297506409746597 }, { "name": "model.layers.37.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.649422061855148e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006998521275818348, "sensitivity": 0.5191337801130173 }, { "name": "model.layers.37.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.186944665387273e-05, "sensitivity": 0.8519602185680781 }, { "name": "model.layers.37.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.900416332835448e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000699941418133676, "sensitivity": 0.5428862868439883 }, { "name": "model.layers.37.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.083494680642616e-05, "sensitivity": 1.5297040600860812 }, { "name": "model.layers.37.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.491730116271356e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006959427846595645, "sensitivity": 0.5354872487826088 }, { "name": "model.layers.37.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.169309199322015e-05, "sensitivity": 0.8503140097137301 }, { "name": "model.layers.37.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.615719255227305e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006972586270421743, "sensitivity": 0.5284244582940595 }, { "name": "model.layers.37.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.093215360015165e-05, "sensitivity": 1.2212163005156236 }, { "name": "model.layers.37.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.656230991415214e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006491739768534899, "sensitivity": 0.5325524421734972 }, { "name": "model.layers.37.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.684213829226792e-05, "sensitivity": 0.6572863949051713 }, { "name": "model.layers.37.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.011159724839672e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006349403411149979, "sensitivity": 0.5605172066252299 }, { "name": "model.layers.37.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4441801542707253e-06, "sensitivity": 2.0980290268640456 }, { "name": "model.layers.37.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8294484789294074e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.306679279077798e-05, "sensitivity": 0.7630241909422757 }, { "name": "model.layers.37.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000683446298353374, "sensitivity": 0.5718973273889251 }, { "name": "model.layers.37.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.713724923836708e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006748434971086681, "sensitivity": 0.5283168754136961 }, { "name": "model.layers.37.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7480603572912514e-05, "sensitivity": 1.0537997630210352 }, { "name": "model.layers.37.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4402638726096484e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0575919633265585e-05, "sensitivity": 0.7946288974825142 }, { "name": "model.layers.37.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.810303264297545e-05, "sensitivity": 0.6555779267110555 }, { "name": "model.layers.37.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2314778814470628e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006537241279147565, "sensitivity": 0.5862601638849012 }, { "name": "model.layers.37.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.2508464907296e-05, "sensitivity": 0.970509945816625 }, { "name": "model.layers.37.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0489645774214296e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006891717202961445, "sensitivity": 0.5156520844781036 }, { "name": "model.layers.37.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.067997310310602e-05, "sensitivity": 0.7992541945316728 }, { "name": "model.layers.37.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4284368035077932e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006770477630198002, "sensitivity": 0.5743152870027705 }, { "name": "model.layers.37.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.245107215363532e-05, "sensitivity": 0.719531326721042 }, { "name": "model.layers.37.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0509995718166465e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.127853703219444e-05, "sensitivity": 0.6477428766594358 }, { "name": "model.layers.37.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0660706720955204e-05, "sensitivity": 1.9710391840108836 }, { "name": "model.layers.37.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0091016520163976e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006412186776287854, "sensitivity": 0.5088055154310436 }, { "name": "model.layers.37.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7212608226109296e-05, "sensitivity": 0.9328043133181236 }, { "name": "model.layers.37.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.776209258736344e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006299125961959362, "sensitivity": 0.5842508073259671 }, { "name": "model.layers.37.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1167439879500307e-05, "sensitivity": 1.31137204304954 }, { "name": "model.layers.37.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2373210438454407e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.055086851119995e-05, "sensitivity": 0.6693938467451219 }, { "name": "model.layers.37.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0220627347007394e-05, "sensitivity": 0.8915977765906784 }, { "name": "model.layers.37.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.45181625411351e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006736153736710548, "sensitivity": 0.551629779007532 }, { "name": "model.layers.37.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.16139150224626e-05, "sensitivity": 0.6468572061501534 }, { "name": "model.layers.37.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.244876769618713e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006723962724208832, "sensitivity": 0.5142558823983778 }, { "name": "model.layers.37.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.187464896356687e-05, "sensitivity": 0.6911714096812139 }, { "name": "model.layers.37.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.134232434196747e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006845792522653937, "sensitivity": 0.5446161175166592 }, { "name": "model.layers.37.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.022815068718046e-05, "sensitivity": 0.9820657634935785 }, { "name": "model.layers.37.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.935732699275832e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006805739249102771, "sensitivity": 0.549917102827771 }, { "name": "model.layers.37.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0943853339995258e-05, "sensitivity": 1.7381985756819223 }, { "name": "model.layers.37.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.934478733455762e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.943485302850604e-05, "sensitivity": 0.6596687729967982 }, { "name": "model.layers.37.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9473088185768574e-05, "sensitivity": 0.8920275092829615 }, { "name": "model.layers.37.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.065453241419164e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006441720761358738, "sensitivity": 0.5462316276126933 }, { "name": "model.layers.37.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9827056247740984e-05, "sensitivity": 0.8005337985460637 }, { "name": "model.layers.37.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.123493332983344e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006594903534278274, "sensitivity": 0.5100425383967019 }, { "name": "model.layers.37.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1518297469592653e-05, "sensitivity": 1.3879762734429852 }, { "name": "model.layers.37.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.732941753602063e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007081359508447349, "sensitivity": 0.5644349857285658 }, { "name": "model.layers.37.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.193906301632524e-05, "sensitivity": 0.6873111121505817 }, { "name": "model.layers.37.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.269386514963116e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006802353891544044, "sensitivity": 0.5162391114177705 }, { "name": "model.layers.37.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4623807955067605e-05, "sensitivity": 0.9460798911165089 }, { "name": "model.layers.37.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6311605577357113e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.3069088608026505e-05, "sensitivity": 0.6393201690116905 }, { "name": "model.layers.37.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1639006515906658e-05, "sensitivity": 1.2235306861746142 }, { "name": "model.layers.37.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4959522331992048e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.429952918551862e-05, "sensitivity": 0.7281708606492134 }, { "name": "model.layers.37.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9246347518637776e-05, "sensitivity": 0.8100237819486493 }, { "name": "model.layers.37.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.569563417244353e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006421346915885806, "sensitivity": 0.5279682681546277 }, { "name": "model.layers.37.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.164993828861043e-05, "sensitivity": 0.825384085346361 }, { "name": "model.layers.37.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0138396646652836e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006927895592525601, "sensitivity": 0.5101231465199407 }, { "name": "model.layers.37.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.750307900598273e-05, "sensitivity": 0.7597483983713151 }, { "name": "model.layers.37.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.132627501960087e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006501316092908382, "sensitivity": 0.5273457405786252 }, { "name": "model.layers.37.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.846087515237741e-05, "sensitivity": 0.9236901214394716 }, { "name": "model.layers.37.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4352447124110768e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006698904326185584, "sensitivity": 0.5992858287529784 }, { "name": "model.layers.37.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.901986489538103e-05, "sensitivity": 0.7126783236756877 }, { "name": "model.layers.37.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.907125786412507e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008026680443435907, "sensitivity": 0.5459478657679557 }, { "name": "model.layers.37.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.273431790759787e-05, "sensitivity": 1.1847278515481288 }, { "name": "model.layers.37.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.45285001105367e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007479221094399691, "sensitivity": 0.5606961864213786 }, { "name": "model.layers.37.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.1140674562047934e-06, "sensitivity": 2.09707789146728 }, { "name": "model.layers.37.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.714534942555474e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 4.982907194062136e-05, "sensitivity": 0.6997687064355231 }, { "name": "model.layers.37.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.584209768334404e-05, "sensitivity": 0.7105042581769656 }, { "name": "model.layers.37.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.899263891886221e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007648984901607037, "sensitivity": 0.5424628158993285 }, { "name": "model.layers.37.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.311644392553717e-05, "sensitivity": 0.6009033639897583 }, { "name": "model.layers.37.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.685067657803302e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006962268380448222, "sensitivity": 0.5248251488921027 }, { "name": "model.layers.37.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7643057516543195e-05, "sensitivity": 0.9008569218404563 }, { "name": "model.layers.37.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.308702715316031e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6666780437808484e-05, "sensitivity": 0.7839186093973789 }, { "name": "model.layers.37.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.890681495657191e-05, "sensitivity": 0.6941545844308298 }, { "name": "model.layers.37.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.716875529695244e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006469757645390928, "sensitivity": 0.5265873871565041 }, { "name": "model.layers.37.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.2412100406654645e-06, "sensitivity": 2.097489371874163 }, { "name": "model.layers.37.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0800115433085011e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.3102463425602764e-05, "sensitivity": 1.0752350784577989 }, { "name": "model.layers.37.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9430945839267224e-05, "sensitivity": 0.6240700466467385 }, { "name": "model.layers.37.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.036154213186819e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006674231262877584, "sensitivity": 0.5516167955671343 }, { "name": "model.layers.37.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0733531427104026e-05, "sensitivity": 0.6602722870435423 }, { "name": "model.layers.37.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.240046215883922e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006778130773454905, "sensitivity": 0.5151939220837308 }, { "name": "model.layers.37.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.960347698419355e-05, "sensitivity": 0.9600211299643083 }, { "name": "model.layers.37.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.108719953270338e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006849092314951122, "sensitivity": 0.5286221778623037 }, { "name": "model.layers.37.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.893439083592966e-05, "sensitivity": 0.6586392020387694 }, { "name": "model.layers.37.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.780119742368697e-07, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006442448357120156, "sensitivity": 0.5424659202123847 }, { "name": "model.layers.37.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 2.0319412215030752e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.5518475013086572e-06, "sensitivity": 2.1031899015091904 }, { "name": "model.layers.37.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 3.1521030905423686e-06, "sensitivity": 10.0 }, { "name": "model.layers.37.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.59159299073508e-06, "sensitivity": 2.1044061654883115 }, { "name": "model.layers.37.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 7.091897714417428e-06, "sensitivity": 2.2035368899941923 }, { "name": "model.layers.37.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00019590994634199888, "sensitivity": 0.9431856680704118 }, { "name": "model.layers.37.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.425206119165523e-05, "sensitivity": 1.3999416397039393 }, { "name": "model.layers.37.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0006590730044990778, "sensitivity": 0.5898597784443735 }, { "name": "model.layers.37.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003035494592040777, "sensitivity": 0.7966544857602197 }, { "name": "model.layers.38.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0736963304225355e-05, "sensitivity": 1.4450468119761855 }, { "name": "model.layers.38.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1331335372233298e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.870965833310038e-05, "sensitivity": 0.6737918066876849 }, { "name": "model.layers.38.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.063057662686333e-05, "sensitivity": 0.8598348090894042 }, { "name": "model.layers.38.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1859704045491526e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006938841543160379, "sensitivity": 0.5472672600634879 }, { "name": "model.layers.38.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4126607058860827e-06, "sensitivity": 2.0972644224919708 }, { "name": "model.layers.38.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.511306989727018e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007238363614305854, "sensitivity": 0.5279065111537898 }, { "name": "model.layers.38.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0728678363375366e-05, "sensitivity": 0.7704957850408932 }, { "name": "model.layers.38.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.331730552730733e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006947300862520933, "sensitivity": 0.5429552792631855 }, { "name": "model.layers.38.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.678594970959239e-05, "sensitivity": 0.9333033528226451 }, { "name": "model.layers.38.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1642458730420913e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.570552821154706e-05, "sensitivity": 0.6333797279466585 }, { "name": "model.layers.38.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1423270734667312e-05, "sensitivity": 1.967436677731432 }, { "name": "model.layers.38.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5442030871781753e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.082516483729705e-05, "sensitivity": 0.8879931041445531 }, { "name": "model.layers.38.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.811582013848238e-05, "sensitivity": 0.7997905184011174 }, { "name": "model.layers.38.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.061641321750358e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006506051868200302, "sensitivity": 0.5800605825678663 }, { "name": "model.layers.38.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.377868703566492e-05, "sensitivity": 0.6536306710330402 }, { "name": "model.layers.38.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.996768888711813e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007458789041265845, "sensitivity": 0.552765640176303 }, { "name": "model.layers.38.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0259142628638074e-05, "sensitivity": 0.6884224931963461 }, { "name": "model.layers.38.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.461678362436942e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000696134171448648, "sensitivity": 0.5129081050464646 }, { "name": "model.layers.38.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.561011832673103e-05, "sensitivity": 0.6264457918862952 }, { "name": "model.layers.38.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.929504815569089e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007240357808768749, "sensitivity": 0.5412743854788815 }, { "name": "model.layers.38.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006758588133379817, "sensitivity": 0.5482703139385345 }, { "name": "model.layers.38.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.677696546830703e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006702930550090969, "sensitivity": 0.5298997387460779 }, { "name": "model.layers.38.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0498922165425029e-05, "sensitivity": 1.7208293134417527 }, { "name": "model.layers.38.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.05564184247487e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006177224568091333, "sensitivity": 0.5778145635366704 }, { "name": "model.layers.38.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.383556319633499e-05, "sensitivity": 0.650148350434733 }, { "name": "model.layers.38.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.361405659547017e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007266210741363466, "sensitivity": 0.5254834461359391 }, { "name": "model.layers.38.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.280293746385723e-05, "sensitivity": 0.804707161420599 }, { "name": "model.layers.38.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.458293905277969e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006981625920161605, "sensitivity": 0.5814683516531027 }, { "name": "model.layers.38.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.380418926710263e-05, "sensitivity": 0.6336346515343672 }, { "name": "model.layers.38.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.381045179499779e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007400352042168379, "sensitivity": 0.5457607789702074 }, { "name": "model.layers.38.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.308348383754492e-05, "sensitivity": 0.7895229864661133 }, { "name": "model.layers.38.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.162410267686937e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006920917658135295, "sensitivity": 0.5414423890813646 }, { "name": "model.layers.38.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.17111218161881e-05, "sensitivity": 0.9261949515672412 }, { "name": "model.layers.38.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.448383030350669e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007183767738752067, "sensitivity": 0.5116324217371451 }, { "name": "model.layers.38.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.549419777002186e-05, "sensitivity": 0.6446354045413943 }, { "name": "model.layers.38.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.004338608065154e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007221675477921963, "sensitivity": 0.5822686108475714 }, { "name": "model.layers.38.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.869466986041516e-05, "sensitivity": 0.8778600361072899 }, { "name": "model.layers.38.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.868595043371897e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.166766252135858e-05, "sensitivity": 0.6145040325997222 }, { "name": "model.layers.38.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.915674410061911e-05, "sensitivity": 0.6713044429138317 }, { "name": "model.layers.38.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.456653972643835e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006673064781352878, "sensitivity": 0.5240878536480446 }, { "name": "model.layers.38.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.572407437488437e-05, "sensitivity": 0.6222399476011043 }, { "name": "model.layers.38.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.821663979892037e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007359473966062069, "sensitivity": 0.5371415374473388 }, { "name": "model.layers.38.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.703104397980496e-05, "sensitivity": 1.085422717291598 }, { "name": "model.layers.38.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.555099159617384e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006517720175907016, "sensitivity": 0.5528293805016399 }, { "name": "model.layers.38.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1577378245419823e-05, "sensitivity": 1.7077207007975004 }, { "name": "model.layers.38.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.164510856862762e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.203556404216215e-05, "sensitivity": 0.7083354980680456 }, { "name": "model.layers.38.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6880518968682736e-05, "sensitivity": 0.9325231815145922 }, { "name": "model.layers.38.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0176053137911367e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006210339488461614, "sensitivity": 0.5453678415415362 }, { "name": "model.layers.38.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.408622721210122e-05, "sensitivity": 0.611026328930356 }, { "name": "model.layers.38.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.731653113296488e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007151947356760502, "sensitivity": 0.5175118594333733 }, { "name": "model.layers.38.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.1031445511616766e-05, "sensitivity": 0.8050350946567719 }, { "name": "model.layers.38.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.510345080343541e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006841346621513367, "sensitivity": 0.5633464371178575 }, { "name": "model.layers.38.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.3143343393458053e-05, "sensitivity": 0.7645179687406712 }, { "name": "model.layers.38.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0193438129135757e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006647929549217224, "sensitivity": 0.5967343195817375 }, { "name": "model.layers.38.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.769041308667511e-05, "sensitivity": 0.7927742273244132 }, { "name": "model.layers.38.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.137312438004301e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9421050536911935e-05, "sensitivity": 0.6526393083462011 }, { "name": "model.layers.38.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7862838730216026e-05, "sensitivity": 0.9473071246328705 }, { "name": "model.layers.38.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.991072266122501e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.85821398999542e-05, "sensitivity": 0.7826239638919337 }, { "name": "model.layers.38.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.164536171127111e-05, "sensitivity": 0.6105057223448729 }, { "name": "model.layers.38.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.666500773164444e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006874680984765291, "sensitivity": 0.5786716442131148 }, { "name": "model.layers.38.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.196635513333604e-05, "sensitivity": 0.7532722795094581 }, { "name": "model.layers.38.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.961955811377265e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000682518701069057, "sensitivity": 0.5714278202388292 }, { "name": "model.layers.38.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.2158768186054658e-05, "sensitivity": 1.5966347617693764 }, { "name": "model.layers.38.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0647603403413086e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007416459266096354, "sensitivity": 0.5235640456118038 }, { "name": "model.layers.38.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006940662860870361, "sensitivity": 0.5618557854353237 }, { "name": "model.layers.38.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.60805436989176e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.192050932440907e-05, "sensitivity": 0.8173388486005975 }, { "name": "model.layers.38.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1720292604877613e-05, "sensitivity": 1.7655637718487405 }, { "name": "model.layers.38.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.750500117253978e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007173746707849205, "sensitivity": 0.5435131589486102 }, { "name": "model.layers.38.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.979033812764101e-05, "sensitivity": 1.135255361274395 }, { "name": "model.layers.38.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2596987062352127e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.2996417353861034e-05, "sensitivity": 1.9063396529536423 }, { "name": "model.layers.38.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.800568760605529e-05, "sensitivity": 0.7146855740234075 }, { "name": "model.layers.38.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0921083912762697e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0395701439119875e-05, "sensitivity": 0.7230410049783462 }, { "name": "model.layers.38.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.999011773383245e-05, "sensitivity": 0.9924456461320095 }, { "name": "model.layers.38.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.194724839289847e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.986793985357508e-05, "sensitivity": 0.6898269190014378 }, { "name": "model.layers.38.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006816412205807865, "sensitivity": 0.5752718719741018 }, { "name": "model.layers.38.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.284106343126041e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006688748835586011, "sensitivity": 0.5305661507782721 }, { "name": "model.layers.38.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.840432640979998e-05, "sensitivity": 0.7908319874086872 }, { "name": "model.layers.38.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.161337975958304e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006623369408771396, "sensitivity": 0.5650900944018682 }, { "name": "model.layers.38.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.522317223949358e-05, "sensitivity": 0.874938698699304 }, { "name": "model.layers.38.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.459506031817e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7271325204055756e-05, "sensitivity": 0.6488818234880716 }, { "name": "model.layers.38.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.22064180788584e-05, "sensitivity": 0.6225092133515171 }, { "name": "model.layers.38.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.114087353926152e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.233610474737361e-05, "sensitivity": 0.6140325260718644 }, { "name": "model.layers.38.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.801624840591103e-05, "sensitivity": 0.8182234792255381 }, { "name": "model.layers.38.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.894464258446533e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007674290100112557, "sensitivity": 0.5995419781952531 }, { "name": "model.layers.38.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.830479130963795e-05, "sensitivity": 0.8101819674126365 }, { "name": "model.layers.38.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.794924385962076e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006686918204650283, "sensitivity": 0.5775589901206843 }, { "name": "model.layers.38.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.046903945389204e-05, "sensitivity": 0.6401360978656252 }, { "name": "model.layers.38.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.115149855962954e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006707264110445976, "sensitivity": 0.5470896253240305 }, { "name": "model.layers.38.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1144637937832158e-05, "sensitivity": 1.2138131898756135 }, { "name": "model.layers.38.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.647925824334379e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006737086805514991, "sensitivity": 0.5272079686142046 }, { "name": "model.layers.38.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.897700692818034e-06, "sensitivity": 1.8399447774431854 }, { "name": "model.layers.38.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.195443473989144e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006632436998188496, "sensitivity": 0.5220072817727663 }, { "name": "model.layers.38.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.678798672510311e-05, "sensitivity": 0.6682461626713371 }, { "name": "model.layers.38.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2090803238606895e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007542503881268203, "sensitivity": 0.5239839144945017 }, { "name": "model.layers.38.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0863640101160854e-05, "sensitivity": 0.7556599921199358 }, { "name": "model.layers.38.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0096244977830793e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.927976962993853e-05, "sensitivity": 0.6249112004967459 }, { "name": "model.layers.38.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.176536408020183e-05, "sensitivity": 0.814277874146613 }, { "name": "model.layers.38.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1035315310437e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006802745047025383, "sensitivity": 0.5551582407974782 }, { "name": "model.layers.38.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.704093200620264e-05, "sensitivity": 0.7778790875137334 }, { "name": "model.layers.38.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.086074462364195e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006411084905266762, "sensitivity": 0.5432472540871147 }, { "name": "model.layers.38.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.818324279971421e-05, "sensitivity": 0.7338413233696585 }, { "name": "model.layers.38.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.402800636351458e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006578720058314502, "sensitivity": 0.5269159813730493 }, { "name": "model.layers.38.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.928318569203839e-05, "sensitivity": 0.9053979458792205 }, { "name": "model.layers.38.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.917759603515151e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.179577758302912e-05, "sensitivity": 0.8914989525133694 }, { "name": "model.layers.38.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.106749060563743e-05, "sensitivity": 0.6627390462730558 }, { "name": "model.layers.38.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.105386430339422e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006960115279071033, "sensitivity": 0.5304644745238295 }, { "name": "model.layers.38.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.87084102537483e-05, "sensitivity": 0.6550178697787897 }, { "name": "model.layers.38.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.397425628776546e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007630162872374058, "sensitivity": 0.5459293869206491 }, { "name": "model.layers.38.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1009549780283123e-05, "sensitivity": 1.2550138297930702 }, { "name": "model.layers.38.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8839950826077256e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.587643292732537e-05, "sensitivity": 0.765763643119126 }, { "name": "model.layers.38.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1342013749526814e-05, "sensitivity": 1.2012000882374338 }, { "name": "model.layers.38.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2528583965831785e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007030301494523883, "sensitivity": 0.5622507603511799 }, { "name": "model.layers.38.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1798299965448678e-05, "sensitivity": 1.7084111376727675 }, { "name": "model.layers.38.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6336357475665864e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007041497156023979, "sensitivity": 0.5616675308516614 }, { "name": "model.layers.38.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007002138299867511, "sensitivity": 0.5290153853068132 }, { "name": "model.layers.38.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.02783552242181e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007168317097239196, "sensitivity": 0.5739676205701342 }, { "name": "model.layers.38.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1702543815772515e-05, "sensitivity": 1.3104003358901097 }, { "name": "model.layers.38.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.548892083126702e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007107759593054652, "sensitivity": 0.5229263627977203 }, { "name": "model.layers.38.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007367608486674726, "sensitivity": 0.5348070909796999 }, { "name": "model.layers.38.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.888032544338785e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007247903267852962, "sensitivity": 0.5585633946410412 }, { "name": "model.layers.38.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.093040039762855e-05, "sensitivity": 1.018133381045087 }, { "name": "model.layers.38.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1163078852405306e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000812046870123595, "sensitivity": 0.539915229174407 }, { "name": "model.layers.38.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.454921059324988e-06, "sensitivity": 2.0976757888695823 }, { "name": "model.layers.38.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2335585779510438e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007022731006145477, "sensitivity": 0.532231430008083 }, { "name": "model.layers.38.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6060780480038375e-05, "sensitivity": 1.0235226563667443 }, { "name": "model.layers.38.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.194548968276649e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006166922394186258, "sensitivity": 0.5507257267935605 }, { "name": "model.layers.38.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0579109584796242e-05, "sensitivity": 1.7146943020678687 }, { "name": "model.layers.38.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.357883416465484e-07, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006664595566689968, "sensitivity": 0.5543239991414078 }, { "name": "model.layers.38.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.9770945982600097e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.5424553768971236e-06, "sensitivity": 2.103727085689983 }, { "name": "model.layers.38.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 3.148520136164734e-06, "sensitivity": 10.0 }, { "name": "model.layers.38.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.6506267002114328e-06, "sensitivity": 2.1063539667222337 }, { "name": "model.layers.38.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 3.493807162158191e-05, "sensitivity": 1.9371376998954295 }, { "name": "model.layers.38.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00022416333376895636, "sensitivity": 0.8421219746571228 }, { "name": "model.layers.38.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.6650426914566197e-05, "sensitivity": 1.1718413829074892 }, { "name": "model.layers.38.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 2, "mse": 0.0006198073970153928, "sensitivity": 0.5865038575004429 }, { "name": "model.layers.38.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003171184507664293, "sensitivity": 0.7989223125306852 }, { "name": "model.layers.39.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.476622754940763e-05, "sensitivity": 0.7100612746416621 }, { "name": "model.layers.39.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.140794645645656e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.648127626045607e-05, "sensitivity": 0.6524057645401786 }, { "name": "model.layers.39.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0538372407609131e-05, "sensitivity": 1.206694647969812 }, { "name": "model.layers.39.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.662712278033723e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006327390437945724, "sensitivity": 0.5244607854412868 }, { "name": "model.layers.39.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.211384607013315e-05, "sensitivity": 0.8091823695630146 }, { "name": "model.layers.39.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.918660796553013e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006852350197732449, "sensitivity": 0.5166797254341666 }, { "name": "model.layers.39.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.262149716145359e-05, "sensitivity": 0.6693471995226878 }, { "name": "model.layers.39.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.623521464163787e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006473431130871177, "sensitivity": 0.5398393426171926 }, { "name": "model.layers.39.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0703110648319125e-05, "sensitivity": 0.9533739002912123 }, { "name": "model.layers.39.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.748055281808774e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000656831543892622, "sensitivity": 0.5549131028197842 }, { "name": "model.layers.39.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006682753446511924, "sensitivity": 0.5912047287791475 }, { "name": "model.layers.39.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.752957233402412e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006577134481631219, "sensitivity": 0.5238076550286463 }, { "name": "model.layers.39.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.932372732786462e-05, "sensitivity": 0.7790726773759558 }, { "name": "model.layers.39.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.812831649469445e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.734008300350979e-05, "sensitivity": 0.6293440480377281 }, { "name": "model.layers.39.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006904881447553635, "sensitivity": 0.5432123620845792 }, { "name": "model.layers.39.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.753922315918317e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006968089728616178, "sensitivity": 0.5253282480979053 }, { "name": "model.layers.39.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 2.1473522792803124e-05, "sensitivity": 0.7930698346433771 }, { "name": "model.layers.39.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.115224560839124e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.4389831449079793e-05, "sensitivity": 1.3108654370863408 }, { "name": "model.layers.39.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0520644536882173e-05, "sensitivity": 1.3711253804553913 }, { "name": "model.layers.39.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3528127738027251e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.73063844058197e-05, "sensitivity": 0.6557413613889793 }, { "name": "model.layers.39.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.127559026936069e-05, "sensitivity": 0.643997713392706 }, { "name": "model.layers.39.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.864417739256169e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000683668302372098, "sensitivity": 0.5045415624879863 }, { "name": "model.layers.39.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006644650129601359, "sensitivity": 0.5573927013725228 }, { "name": "model.layers.39.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.684145089115191e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006450671935454011, "sensitivity": 0.5187871378924244 }, { "name": "model.layers.39.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.973321822239086e-05, "sensitivity": 0.704934521182819 }, { "name": "model.layers.39.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.78963453740289e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006597192259505391, "sensitivity": 0.5160457484352768 }, { "name": "model.layers.39.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.079169543227181e-05, "sensitivity": 0.8022650142507949 }, { "name": "model.layers.39.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.042226570774801e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006857478874735534, "sensitivity": 0.548207998958497 }, { "name": "model.layers.39.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006955274729989469, "sensitivity": 0.5680190199981747 }, { "name": "model.layers.39.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.36810272630828e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006839379202574492, "sensitivity": 0.5366654801834161 }, { "name": "model.layers.39.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9485097153810784e-05, "sensitivity": 1.0272079247369683 }, { "name": "model.layers.39.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.161619007296395e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006585874943993986, "sensitivity": 0.5656811778149674 }, { "name": "model.layers.39.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.266870332183316e-05, "sensitivity": 0.6142284635658392 }, { "name": "model.layers.39.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0610835943225538e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006683479296043515, "sensitivity": 0.5410522825960149 }, { "name": "model.layers.39.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.70434785913676e-05, "sensitivity": 0.9346192318594475 }, { "name": "model.layers.39.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.60811303734954e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.851740934303962e-05, "sensitivity": 0.6916749368442041 }, { "name": "model.layers.39.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.289083103183657e-05, "sensitivity": 0.6514957987878518 }, { "name": "model.layers.39.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.290964276762679e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.432915688492358e-05, "sensitivity": 0.6130050081736167 }, { "name": "model.layers.39.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.242296512937173e-05, "sensitivity": 0.7031621542359285 }, { "name": "model.layers.39.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.678588301336276e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.378129910444841e-05, "sensitivity": 0.7100494938585319 }, { "name": "model.layers.39.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007381384493783116, "sensitivity": 0.5774468796435133 }, { "name": "model.layers.39.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.804241022313363e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007333490066230297, "sensitivity": 0.5193006075985804 }, { "name": "model.layers.39.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0435429430799559e-05, "sensitivity": 1.3987483311705913 }, { "name": "model.layers.39.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0323344667995116e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0577607655432075e-05, "sensitivity": 0.8955970264849787 }, { "name": "model.layers.39.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1491849363665096e-05, "sensitivity": 1.665850294701982 }, { "name": "model.layers.39.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 3.170221589243738e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006805482553318143, "sensitivity": 0.5596758954636547 }, { "name": "model.layers.39.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.986378245230298e-06, "sensitivity": 1.8937587377268428 }, { "name": "model.layers.39.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3215703802416101e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.086035162094049e-05, "sensitivity": 0.8345954554645236 }, { "name": "model.layers.39.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0770621884148568e-05, "sensitivity": 1.2814017965208755 }, { "name": "model.layers.39.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.494630835935823e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006537455483339727, "sensitivity": 0.5970699044888687 }, { "name": "model.layers.39.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0423422837629914e-05, "sensitivity": 0.6227683503793028 }, { "name": "model.layers.39.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.98616383690387e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.198982009664178e-05, "sensitivity": 0.6833482509933733 }, { "name": "model.layers.39.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.023680907674134e-05, "sensitivity": 0.8269617170411199 }, { "name": "model.layers.39.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.481649385634228e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006717643700540066, "sensitivity": 0.5137886567469321 }, { "name": "model.layers.39.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006721188547089696, "sensitivity": 0.5938252827967154 }, { "name": "model.layers.39.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.990604444785276e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.04111046413891e-05, "sensitivity": 0.6408955522232588 }, { "name": "model.layers.39.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.7361356842448004e-06, "sensitivity": 2.043403886084076 }, { "name": "model.layers.39.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0014427971327677e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.925461639184505e-05, "sensitivity": 0.6079326658229092 }, { "name": "model.layers.39.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8652294683270156e-05, "sensitivity": 1.1065439537262416 }, { "name": "model.layers.39.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.393300620606169e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006562386406585574, "sensitivity": 0.5639461269711041 }, { "name": "model.layers.39.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007083863019943237, "sensitivity": 0.5529114478539646 }, { "name": "model.layers.39.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.899235813762061e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006930408999323845, "sensitivity": 0.5616893920714676 }, { "name": "model.layers.39.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.225090328371152e-05, "sensitivity": 0.8113280813529479 }, { "name": "model.layers.39.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.470771379303187e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.253809260670096e-05, "sensitivity": 0.7712066241099206 }, { "name": "model.layers.39.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1600927791732829e-05, "sensitivity": 1.2516683917041294 }, { "name": "model.layers.39.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.959716074561584e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006799572147428989, "sensitivity": 0.5438361846779335 }, { "name": "model.layers.39.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0600250789138954e-05, "sensitivity": 1.3243370687592704 }, { "name": "model.layers.39.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.345240303242463e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.119362999219447e-05, "sensitivity": 0.6046896564761632 }, { "name": "model.layers.39.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.448876618174836e-05, "sensitivity": 1.1911252153280665 }, { "name": "model.layers.39.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.438641548811574e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.4672229452989995e-05, "sensitivity": 0.6305648166994127 }, { "name": "model.layers.39.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1219084626645781e-05, "sensitivity": 1.2869700113300997 }, { "name": "model.layers.39.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.919267540681176e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006720914389006793, "sensitivity": 0.5513354820635449 }, { "name": "model.layers.39.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.655768083874136e-05, "sensitivity": 0.9031072482191946 }, { "name": "model.layers.39.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.071352244252921e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007671565981581807, "sensitivity": 0.5139005623911344 }, { "name": "model.layers.39.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.505981243913993e-05, "sensitivity": 0.7783680316009035 }, { "name": "model.layers.39.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0032263162429444e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005943889264017344, "sensitivity": 0.562977440384917 }, { "name": "model.layers.39.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9551093727350235e-05, "sensitivity": 1.1519919714173843 }, { "name": "model.layers.39.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2763093764078803e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.389725604094565e-05, "sensitivity": 0.6269457640661141 }, { "name": "model.layers.39.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0118163673905656e-05, "sensitivity": 0.8780587219607586 }, { "name": "model.layers.39.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.164872156157799e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006721747922711074, "sensitivity": 0.5327180638557969 }, { "name": "model.layers.39.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1105941666755825e-05, "sensitivity": 1.212706536766602 }, { "name": "model.layers.39.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.915624908288009e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006826884346082807, "sensitivity": 0.5174000358002846 }, { "name": "model.layers.39.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.184406083775684e-05, "sensitivity": 0.7013552858728911 }, { "name": "model.layers.39.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.733765414741356e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006869544158689678, "sensitivity": 0.5375295132409327 }, { "name": "model.layers.39.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.2240674297790974e-06, "sensitivity": 2.0973038619525926 }, { "name": "model.layers.39.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.98394511952938e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006719360826537013, "sensitivity": 0.551211231169531 }, { "name": "model.layers.39.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.625151581829414e-05, "sensitivity": 0.7921709592767918 }, { "name": "model.layers.39.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.837179734655365e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007439572364091873, "sensitivity": 0.5961308960590006 }, { "name": "model.layers.39.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.727499956265092e-05, "sensitivity": 0.8725677666147085 }, { "name": "model.layers.39.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.990274065785343e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006342043052427471, "sensitivity": 0.5294861475378808 }, { "name": "model.layers.39.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1400926268834155e-05, "sensitivity": 1.382493598680396 }, { "name": "model.layers.39.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.372045400989009e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.053807373973541e-05, "sensitivity": 0.7337771771169108 }, { "name": "model.layers.39.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7774515880737454e-05, "sensitivity": 0.7815003394631265 }, { "name": "model.layers.39.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1994748092547525e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006434351671487093, "sensitivity": 0.5981944598392975 }, { "name": "model.layers.39.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.646948920912109e-05, "sensitivity": 0.7369908125173755 }, { "name": "model.layers.39.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.640923851999105e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006283233524300158, "sensitivity": 0.545940575552214 }, { "name": "model.layers.39.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.0981829038646538e-06, "sensitivity": 2.0970718765438763 }, { "name": "model.layers.39.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.951515274522535e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7861427194438875e-05, "sensitivity": 0.6026762774925586 }, { "name": "model.layers.39.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.921417323406786e-05, "sensitivity": 0.8378957999059257 }, { "name": "model.layers.39.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.193703138204e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006554603460244834, "sensitivity": 0.49314366421501654 }, { "name": "model.layers.39.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0786752682179213e-05, "sensitivity": 1.2452967157671249 }, { "name": "model.layers.39.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0107200978382025e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.075889541534707e-05, "sensitivity": 0.6320838294192164 }, { "name": "model.layers.39.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.062581087462604e-05, "sensitivity": 1.0911652309922621 }, { "name": "model.layers.39.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.476967536807933e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006886426126584411, "sensitivity": 0.5446675780007126 }, { "name": "model.layers.39.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.724030779674649e-05, "sensitivity": 0.8387992189104132 }, { "name": "model.layers.39.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.817422667561914e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006621055072173476, "sensitivity": 0.5145803498293915 }, { "name": "model.layers.39.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.234316970221698e-05, "sensitivity": 0.8433676454876173 }, { "name": "model.layers.39.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.504972487964551e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.500181916635484e-05, "sensitivity": 0.6013117411086724 }, { "name": "model.layers.39.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.874373502796516e-05, "sensitivity": 0.6904920428135264 }, { "name": "model.layers.39.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0303363069397165e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007854144787415862, "sensitivity": 0.5303263720866759 }, { "name": "model.layers.39.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006808532634750009, "sensitivity": 0.5321442712418644 }, { "name": "model.layers.39.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.530355787821463e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.983895971439779e-05, "sensitivity": 0.6002345346811967 }, { "name": "model.layers.39.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1299083780613728e-05, "sensitivity": 1.2197915405592077 }, { "name": "model.layers.39.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.7910409724208876e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006881991284899414, "sensitivity": 0.5951311648450504 }, { "name": "model.layers.39.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007021564524620771, "sensitivity": 0.5895181583567696 }, { "name": "model.layers.39.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.887436138138582e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007092795567587018, "sensitivity": 0.5452753474011182 }, { "name": "model.layers.39.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.066477362764999e-05, "sensitivity": 0.6501283636861791 }, { "name": "model.layers.39.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.930823014452471e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006670200964435935, "sensitivity": 0.5631563706580901 }, { "name": "model.layers.39.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1048219676013105e-05, "sensitivity": 1.2079174434314417 }, { "name": "model.layers.39.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.335081022574741e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007050953572615981, "sensitivity": 0.5784771445204531 }, { "name": "model.layers.39.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006752251647412777, "sensitivity": 0.5125080509255288 }, { "name": "model.layers.39.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.54157588542148e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000665098603349179, "sensitivity": 0.5064372522714233 }, { "name": "model.layers.39.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 9.60523266257951e-06, "sensitivity": 1.8719539008965573 }, { "name": "model.layers.39.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.970683100211318e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0005875746719539165, "sensitivity": 0.5260312906544403 }, { "name": "model.layers.39.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.758394763688557e-05, "sensitivity": 0.7770837608394059 }, { "name": "model.layers.39.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.413449682440842e-07, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006510838866233826, "sensitivity": 0.5287501355776854 }, { "name": "model.layers.39.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.15068493061699e-05, "sensitivity": 0.6042068954172409 }, { "name": "model.layers.39.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1690462997648865e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006654210155829787, "sensitivity": 0.5854190036145648 }, { "name": "model.layers.39.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.8469082760930178e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.5433862447243882e-06, "sensitivity": 2.1043377456269607 }, { "name": "model.layers.39.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 3.165350335621042e-06, "sensitivity": 10.0 }, { "name": "model.layers.39.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.5586573454129393e-06, "sensitivity": 2.1054101712091966 }, { "name": "model.layers.39.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 4, "mse": 3.6057423130841926e-05, "sensitivity": 1.8086148419977652 }, { "name": "model.layers.39.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.000211276113986969, "sensitivity": 0.8069112452484706 }, { "name": "model.layers.39.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.752154275891371e-05, "sensitivity": 1.264455218254882 }, { "name": "model.layers.39.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 4.6707205910934135e-05, "sensitivity": 0.6667339867498504 }, { "name": "model.layers.39.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0003304955898784101, "sensitivity": 0.8798343819188216 }, { "name": "model.layers.40.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8121087931795046e-05, "sensitivity": 0.8178516364461677 }, { "name": "model.layers.40.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.341753527929541e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.962352952337824e-05, "sensitivity": 0.6812436505778894 }, { "name": "model.layers.40.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.405886233551428e-05, "sensitivity": 0.8736066557977898 }, { "name": "model.layers.40.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.959762792277616e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007012709975242615, "sensitivity": 0.5481768485665837 }, { "name": "model.layers.40.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.817396959173493e-05, "sensitivity": 0.9177336908885451 }, { "name": "model.layers.40.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.395125175615249e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.199230847414583e-05, "sensitivity": 0.7177849777709726 }, { "name": "model.layers.40.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.5113322408287786e-06, "sensitivity": 2.097809060723284 }, { "name": "model.layers.40.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0233904959022766e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000708649109583348, "sensitivity": 0.5353973386708811 }, { "name": "model.layers.40.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007038149051368237, "sensitivity": 0.5657141227728213 }, { "name": "model.layers.40.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.672929657725035e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006967965746298432, "sensitivity": 0.5287922694648037 }, { "name": "model.layers.40.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7869834563462064e-05, "sensitivity": 0.7075894401030691 }, { "name": "model.layers.40.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.526347189923399e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006654573371633887, "sensitivity": 0.527429576756727 }, { "name": "model.layers.40.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.737847459386103e-05, "sensitivity": 0.841907764806302 }, { "name": "model.layers.40.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.213694400183158e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006513843545690179, "sensitivity": 0.5163190298255367 }, { "name": "model.layers.40.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.621115608140826e-05, "sensitivity": 1.166857040449122 }, { "name": "model.layers.40.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2210372233312228e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.809942715335637e-05, "sensitivity": 0.6944964058575638 }, { "name": "model.layers.40.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.19883940089494e-05, "sensitivity": 0.6823616538286863 }, { "name": "model.layers.40.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.335016789511428e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006859757704660296, "sensitivity": 0.537409152042701 }, { "name": "model.layers.40.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.066107744118199e-05, "sensitivity": 1.1821976805641325 }, { "name": "model.layers.40.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.797085572747164e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006700476515106857, "sensitivity": 0.5874059759940562 }, { "name": "model.layers.40.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.625667836284265e-05, "sensitivity": 0.9408559566292883 }, { "name": "model.layers.40.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.814019227225799e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006354874931275845, "sensitivity": 0.5032430401995172 }, { "name": "model.layers.40.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.743294605053961e-05, "sensitivity": 1.052790293838426 }, { "name": "model.layers.40.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0851209708562237e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000644017243757844, "sensitivity": 0.5443894649166089 }, { "name": "model.layers.40.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.42257509753108e-05, "sensitivity": 0.873540188177285 }, { "name": "model.layers.40.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.513713621345232e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00074167107231915, "sensitivity": 0.5096240122157427 }, { "name": "model.layers.40.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1970626474067103e-05, "sensitivity": 1.3076308095874911 }, { "name": "model.layers.40.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.289802053695894e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007564167026430368, "sensitivity": 0.5654844866626042 }, { "name": "model.layers.40.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.871427129022777e-05, "sensitivity": 0.8801380603145604 }, { "name": "model.layers.40.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.724059744556143e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006581732886843383, "sensitivity": 0.5542626829707376 }, { "name": "model.layers.40.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006891795201227069, "sensitivity": 0.5460115770292574 }, { "name": "model.layers.40.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.923263408178173e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006830228376202285, "sensitivity": 0.5610455670300544 }, { "name": "model.layers.40.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.138946628198028e-05, "sensitivity": 0.8273367704431015 }, { "name": "model.layers.40.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.86518910445011e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006641907384619117, "sensitivity": 0.5247007686874113 }, { "name": "model.layers.40.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.592979480046779e-05, "sensitivity": 0.624622927790186 }, { "name": "model.layers.40.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1319635859763366e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.37564662611112e-05, "sensitivity": 0.6405328797655624 }, { "name": "model.layers.40.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.167396350065246e-05, "sensitivity": 0.9460566592544228 }, { "name": "model.layers.40.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2082720104444888e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007024985970929265, "sensitivity": 0.5835881133858595 }, { "name": "model.layers.40.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1857850040541962e-05, "sensitivity": 1.361629432937203 }, { "name": "model.layers.40.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4418841374208569e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.028022471582517e-05, "sensitivity": 0.785790759146431 }, { "name": "model.layers.40.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0854228094103746e-05, "sensitivity": 1.5195395785628663 }, { "name": "model.layers.40.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.952653848202317e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.991497164359316e-05, "sensitivity": 0.7290266965503246 }, { "name": "model.layers.40.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9892576246056706e-05, "sensitivity": 1.02604805685159 }, { "name": "model.layers.40.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1201180996067706e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006396970129571855, "sensitivity": 0.5653383470234207 }, { "name": "model.layers.40.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1049184649891686e-05, "sensitivity": 1.5032121094235942 }, { "name": "model.layers.40.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0839253263839055e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.860087912878953e-05, "sensitivity": 0.7716582170119777 }, { "name": "model.layers.40.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0773538280045614e-05, "sensitivity": 0.6146371628167426 }, { "name": "model.layers.40.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.59762473939918e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.958662222838029e-05, "sensitivity": 0.6343307621519229 }, { "name": "model.layers.40.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.885143036721274e-05, "sensitivity": 1.1576873430163013 }, { "name": "model.layers.40.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.590540687691828e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.839686491526663e-05, "sensitivity": 0.6288812532872442 }, { "name": "model.layers.40.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8698904467746615e-05, "sensitivity": 1.0926980244585291 }, { "name": "model.layers.40.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.802882914300426e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.958421388641e-05, "sensitivity": 0.716836638056771 }, { "name": "model.layers.40.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.436802505049855e-05, "sensitivity": 0.8627727070667928 }, { "name": "model.layers.40.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.178882697189692e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007029238040558994, "sensitivity": 0.5303473133785008 }, { "name": "model.layers.40.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.03547484590672e-05, "sensitivity": 0.7808772041245244 }, { "name": "model.layers.40.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0011483482230688e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.277500844793394e-05, "sensitivity": 0.6092796425528677 }, { "name": "model.layers.40.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1635862392722629e-05, "sensitivity": 1.8765914296092248 }, { "name": "model.layers.40.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2285989896554383e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.045298505341634e-05, "sensitivity": 0.6800174379388412 }, { "name": "model.layers.40.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.534165004268289e-05, "sensitivity": 0.6138151745338231 }, { "name": "model.layers.40.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.595785286364844e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.375550583470613e-05, "sensitivity": 0.6090123459742544 }, { "name": "model.layers.40.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.405618478311226e-05, "sensitivity": 0.7771500723526146 }, { "name": "model.layers.40.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.998283197390265e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.370826304191723e-05, "sensitivity": 0.6611920125826133 }, { "name": "model.layers.40.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.470950756920502e-05, "sensitivity": 0.7402160600942838 }, { "name": "model.layers.40.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.65752269874065e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007121765520423651, "sensitivity": 0.5262406588178846 }, { "name": "model.layers.40.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9131427406100556e-05, "sensitivity": 1.0450480074874315 }, { "name": "model.layers.40.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.615211987082148e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006784303113818169, "sensitivity": 0.5076655225368633 }, { "name": "model.layers.40.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.00066953751957044, "sensitivity": 0.5981714674928128 }, { "name": "model.layers.40.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.321957014028158e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006598655018024147, "sensitivity": 0.5150015882052565 }, { "name": "model.layers.40.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.331222539301962e-05, "sensitivity": 0.6799515348207157 }, { "name": "model.layers.40.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.074733616718731e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007255206583067775, "sensitivity": 0.5396972447882777 }, { "name": "model.layers.40.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0649231626302935e-05, "sensitivity": 1.2013060501174786 }, { "name": "model.layers.40.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0657497568899998e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000662231061141938, "sensitivity": 0.5835230230452935 }, { "name": "model.layers.40.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.335112993838266e-05, "sensitivity": 0.7985328444484188 }, { "name": "model.layers.40.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.684752745262813e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007147648138925433, "sensitivity": 0.5268945773934967 }, { "name": "model.layers.40.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.117508019087836e-05, "sensitivity": 0.9764783717783857 }, { "name": "model.layers.40.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.299889486806933e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006732306210324168, "sensitivity": 0.5491633004986703 }, { "name": "model.layers.40.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.084538598661311e-05, "sensitivity": 1.5505420896948876 }, { "name": "model.layers.40.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.115187029034132e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.919762043049559e-05, "sensitivity": 0.6542507819183647 }, { "name": "model.layers.40.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.77844402869232e-05, "sensitivity": 0.9222549567135176 }, { "name": "model.layers.40.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.162093440143508e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.095062053645961e-05, "sensitivity": 0.7993033849261499 }, { "name": "model.layers.40.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.110632911149878e-05, "sensitivity": 1.233408743851293 }, { "name": "model.layers.40.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.173001333489083e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006887412164360285, "sensitivity": 0.5169324847930068 }, { "name": "model.layers.40.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.023387686582282e-05, "sensitivity": 0.973138588350081 }, { "name": "model.layers.40.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.168816197605338e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9194349887548015e-05, "sensitivity": 0.9698673456943088 }, { "name": "model.layers.40.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8304907724959776e-05, "sensitivity": 1.088232713463895 }, { "name": "model.layers.40.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.875192065715964e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006586451781913638, "sensitivity": 0.547035609609048 }, { "name": "model.layers.40.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0197472875006497e-05, "sensitivity": 1.9635503452387377 }, { "name": "model.layers.40.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.05533104033384e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9086185501655564e-05, "sensitivity": 0.6715638016350524 }, { "name": "model.layers.40.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.345484871417284e-05, "sensitivity": 0.6238913693223482 }, { "name": "model.layers.40.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.398666639346629e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007017114548943937, "sensitivity": 0.5686855698649967 }, { "name": "model.layers.40.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0738589480752125e-05, "sensitivity": 1.3437427530026567 }, { "name": "model.layers.40.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0372672250014148e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006565612275153399, "sensitivity": 0.5674978475784388 }, { "name": "model.layers.40.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.086170469643548e-05, "sensitivity": 1.1473019232934123 }, { "name": "model.layers.40.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.977750442478282e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006583728827536106, "sensitivity": 0.5298015409645644 }, { "name": "model.layers.40.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.897074152017012e-05, "sensitivity": 0.7448653256615452 }, { "name": "model.layers.40.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.063354132696986e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7169992942363024e-05, "sensitivity": 0.6167614521796387 }, { "name": "model.layers.40.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.215028406586498e-05, "sensitivity": 0.8830384067041195 }, { "name": "model.layers.40.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.519475164168398e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.816719542257488e-05, "sensitivity": 0.6918792648676715 }, { "name": "model.layers.40.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1313239156152122e-05, "sensitivity": 1.3245784942565664 }, { "name": "model.layers.40.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1107989621450542e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.305113492999226e-05, "sensitivity": 0.8795836342420255 }, { "name": "model.layers.40.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.98431724938564e-05, "sensitivity": 1.097602858849579 }, { "name": "model.layers.40.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.095529213074769e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006672395393252373, "sensitivity": 0.5781743503029454 }, { "name": "model.layers.40.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.9321329899830744e-05, "sensitivity": 0.6032475544815349 }, { "name": "model.layers.40.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.072244893104653e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006813372019678354, "sensitivity": 0.5663149181457351 }, { "name": "model.layers.40.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1659830306598451e-05, "sensitivity": 1.4777859722793336 }, { "name": "model.layers.40.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.161877869701129e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000699371739756316, "sensitivity": 0.5844374951503545 }, { "name": "model.layers.40.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0464619663252961e-05, "sensitivity": 1.3999779194782118 }, { "name": "model.layers.40.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0131960834769416e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9983791288686916e-05, "sensitivity": 0.6358177653654509 }, { "name": "model.layers.40.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.857922562630847e-05, "sensitivity": 0.7578005549678414 }, { "name": "model.layers.40.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.861498261263478e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007855623844079673, "sensitivity": 0.5465149342490281 }, { "name": "model.layers.40.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.212333391886204e-05, "sensitivity": 1.0647942976089952 }, { "name": "model.layers.40.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.017292205091508e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000696613802574575, "sensitivity": 0.5248351170523925 }, { "name": "model.layers.40.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.204645615071058e-05, "sensitivity": 0.6693591780450092 }, { "name": "model.layers.40.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1130546226922888e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007024848600849509, "sensitivity": 0.5147688075540559 }, { "name": "model.layers.40.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.006411730486434e-05, "sensitivity": 1.840243065744812 }, { "name": "model.layers.40.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.875451046857052e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.087362999096513e-05, "sensitivity": 0.8620469024495363 }, { "name": "model.layers.40.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.252165621845052e-05, "sensitivity": 1.1594864129160005 }, { "name": "model.layers.40.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.97114751094341e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007060301722958684, "sensitivity": 0.5435561935695498 }, { "name": "model.layers.40.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.21348769729957e-05, "sensitivity": 0.9036305857699105 }, { "name": "model.layers.40.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0285029929946177e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.771463424433023e-05, "sensitivity": 0.7056960748806214 }, { "name": "model.layers.40.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.01276260567829e-05, "sensitivity": 0.6703623224317394 }, { "name": "model.layers.40.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.986882681303541e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006775002693757415, "sensitivity": 0.5062494810511531 }, { "name": "model.layers.40.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0480437241494656e-05, "sensitivity": 0.6302591640580998 }, { "name": "model.layers.40.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.253957387045375e-07, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006547748926095665, "sensitivity": 0.5370552251395093 }, { "name": "model.layers.40.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.777754631708376e-05, "sensitivity": 0.9732512828712033 }, { "name": "model.layers.40.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0575718079053331e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006484420737251639, "sensitivity": 0.5519115989116903 }, { "name": "model.layers.40.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.24459789833054e-05, "sensitivity": 0.7790472219652775 }, { "name": "model.layers.40.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.06054039861192e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007153379265218973, "sensitivity": 0.5517694204483428 }, { "name": "model.layers.40.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.7376695495840977e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.270014647365315e-06, "sensitivity": 2.1044663463852795 }, { "name": "model.layers.40.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 3.8911248338990845e-06, "sensitivity": 10.0 }, { "name": "model.layers.40.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.6376847042920417e-06, "sensitivity": 2.1060851780085037 }, { "name": "model.layers.40.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 7.248479505506111e-06, "sensitivity": 2.0740932415548965 }, { "name": "model.layers.40.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00017637867131270468, "sensitivity": 0.8819618728863331 }, { "name": "model.layers.40.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.3413685337582137e-05, "sensitivity": 1.9227917845277316 }, { "name": "model.layers.40.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 4.89735793962609e-05, "sensitivity": 0.6321370544899039 }, { "name": "model.layers.40.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.0002854735357686877, "sensitivity": 0.9108304140560908 }, { "name": "model.layers.41.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0014215705450624e-05, "sensitivity": 0.9473154958745369 }, { "name": "model.layers.41.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.368750516434375e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006826412281952798, "sensitivity": 0.5615932660774531 }, { "name": "model.layers.41.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.985827349126339e-05, "sensitivity": 0.8677240144072765 }, { "name": "model.layers.41.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.745276656758506e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007958390633575618, "sensitivity": 0.5958421844649806 }, { "name": "model.layers.41.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.39455538475886e-05, "sensitivity": 1.030727138647284 }, { "name": "model.layers.41.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.095807970676105e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006919209263287485, "sensitivity": 0.5394397701037097 }, { "name": "model.layers.41.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006539843743667006, "sensitivity": 0.5930950856305828 }, { "name": "model.layers.41.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.378641046467237e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006743529811501503, "sensitivity": 0.5070556522250319 }, { "name": "model.layers.41.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1018101758963894e-05, "sensitivity": 1.690785281404908 }, { "name": "model.layers.41.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2646893310375162e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.869124652235769e-05, "sensitivity": 0.6457012682702927 }, { "name": "model.layers.41.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1487334631965496e-05, "sensitivity": 1.4520926125768334 }, { "name": "model.layers.41.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.35863295631134e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006834515370428562, "sensitivity": 0.5858834536051551 }, { "name": "model.layers.41.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.694642459275201e-05, "sensitivity": 0.6613775481780347 }, { "name": "model.layers.41.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.395365173579194e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006464883335866034, "sensitivity": 0.5899191407678787 }, { "name": "model.layers.41.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.081832543713972e-05, "sensitivity": 0.6495739971000933 }, { "name": "model.layers.41.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.676117436654749e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006908971117809415, "sensitivity": 0.5268919054133152 }, { "name": "model.layers.41.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007100695511326194, "sensitivity": 0.5455223061547589 }, { "name": "model.layers.41.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.603985293120786e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006813002983108163, "sensitivity": 0.5218952503385224 }, { "name": "model.layers.41.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.736460298066959e-05, "sensitivity": 0.9049304283695938 }, { "name": "model.layers.41.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.068417400863837e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000680064782500267, "sensitivity": 0.5767533207514354 }, { "name": "model.layers.41.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.51246082270518e-05, "sensitivity": 1.178558103472682 }, { "name": "model.layers.41.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1255007166255382e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.405120802810416e-05, "sensitivity": 0.6288815176326439 }, { "name": "model.layers.41.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007343272445723414, "sensitivity": 0.547303608179574 }, { "name": "model.layers.41.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.548871275910642e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.37494886177592e-05, "sensitivity": 0.6119310724390556 }, { "name": "model.layers.41.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.4149921955540776e-06, "sensitivity": 2.097647856946052 }, { "name": "model.layers.41.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.023821596390917e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9262813010718673e-05, "sensitivity": 0.6283041249671761 }, { "name": "model.layers.41.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0685648350045085e-05, "sensitivity": 0.8280685856734893 }, { "name": "model.layers.41.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0769065283966484e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.145599036244676e-05, "sensitivity": 0.6893037925244163 }, { "name": "model.layers.41.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007029154803603888, "sensitivity": 0.5749125189940472 }, { "name": "model.layers.41.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.338878387803561e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007004638900980353, "sensitivity": 0.5196780525900908 }, { "name": "model.layers.41.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.291441241046414e-05, "sensitivity": 1.0309595490461942 }, { "name": "model.layers.41.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.072036277757434e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007307810592465103, "sensitivity": 0.5529302208551214 }, { "name": "model.layers.41.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.268854485824704e-05, "sensitivity": 0.743441305975727 }, { "name": "model.layers.41.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.832466053514509e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006851596990600228, "sensitivity": 0.5281637750457605 }, { "name": "model.layers.41.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.662749026669189e-05, "sensitivity": 1.0461958465232477 }, { "name": "model.layers.41.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0508447303436697e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.4691619880031794e-05, "sensitivity": 0.6473071977545304 }, { "name": "model.layers.41.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.096180732129142e-05, "sensitivity": 0.8275436160625628 }, { "name": "model.layers.41.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.201231480597926e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007133566541597247, "sensitivity": 0.5396382758944988 }, { "name": "model.layers.41.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.272321242140606e-05, "sensitivity": 1.2612463000026595 }, { "name": "model.layers.41.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1521103715494974e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007958944770507514, "sensitivity": 0.5412189673125579 }, { "name": "model.layers.41.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.376129749696702e-05, "sensitivity": 0.7163280057743239 }, { "name": "model.layers.41.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.043933459906839e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006823735311627388, "sensitivity": 0.5477793794954507 }, { "name": "model.layers.41.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000649435562081635, "sensitivity": 0.5813044986708081 }, { "name": "model.layers.41.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.289839001918153e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006251713493838906, "sensitivity": 0.5375317399326406 }, { "name": "model.layers.41.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6516757467761636e-05, "sensitivity": 0.9144496501318945 }, { "name": "model.layers.41.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0250623745378107e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.753510049544275e-05, "sensitivity": 0.628657909782834 }, { "name": "model.layers.41.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.797897756565362e-05, "sensitivity": 0.6080857899825619 }, { "name": "model.layers.41.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.753821253369097e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006689359433948994, "sensitivity": 0.5111914174731089 }, { "name": "model.layers.41.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0735151590779424e-05, "sensitivity": 1.3112428123900948 }, { "name": "model.layers.41.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0663924285836401e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.217809277586639e-05, "sensitivity": 0.7217420748556598 }, { "name": "model.layers.41.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.099191523389891e-05, "sensitivity": 0.9251190141845483 }, { "name": "model.layers.41.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.439097089445568e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007009552791714668, "sensitivity": 0.5296733226687214 }, { "name": "model.layers.41.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.039080835762434e-05, "sensitivity": 0.6026787071697873 }, { "name": "model.layers.41.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.023547254902951e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006704982370138168, "sensitivity": 0.5331517339497778 }, { "name": "model.layers.41.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.894645048305392e-05, "sensitivity": 0.9725525349363736 }, { "name": "model.layers.41.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.755474366102135e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.599515083711594e-05, "sensitivity": 0.6496344058506931 }, { "name": "model.layers.41.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1318118595227133e-05, "sensitivity": 1.3450392601713232 }, { "name": "model.layers.41.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.53812855691649e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.673176540061831e-05, "sensitivity": 0.7805528750821713 }, { "name": "model.layers.41.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.321809632936493e-05, "sensitivity": 0.9131967794635586 }, { "name": "model.layers.41.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.147396215463232e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006743567064404488, "sensitivity": 0.5178554647872098 }, { "name": "model.layers.41.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.450628279708326e-05, "sensitivity": 0.8405802045532068 }, { "name": "model.layers.41.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0784269761643372e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.156053859740496e-05, "sensitivity": 0.7676735747236455 }, { "name": "model.layers.41.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.704393308609724e-05, "sensitivity": 0.8794433583510991 }, { "name": "model.layers.41.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.016059059111285e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.72550086164847e-05, "sensitivity": 0.6118723014308544 }, { "name": "model.layers.41.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0055794165236875e-05, "sensitivity": 0.6033871816801845 }, { "name": "model.layers.41.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.964540600369219e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006741037359461188, "sensitivity": 0.5239293087266806 }, { "name": "model.layers.41.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.859525845153257e-05, "sensitivity": 0.6390266831767064 }, { "name": "model.layers.41.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.755515412100067e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000645384774543345, "sensitivity": 0.5556026804527863 }, { "name": "model.layers.41.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.898211384192109e-05, "sensitivity": 1.118577280586735 }, { "name": "model.layers.41.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1337796195221017e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006751897162757814, "sensitivity": 0.5446997867065309 }, { "name": "model.layers.41.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.5309807369922055e-06, "sensitivity": 2.0971843871821463 }, { "name": "model.layers.41.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5883800870142295e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0109596233814955e-05, "sensitivity": 0.7958065249428495 }, { "name": "model.layers.41.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006735351635143161, "sensitivity": 0.5540043465878912 }, { "name": "model.layers.41.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.609145088987134e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006709710578434169, "sensitivity": 0.5456628462388693 }, { "name": "model.layers.41.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.1278413340915e-05, "sensitivity": 0.7786273927542846 }, { "name": "model.layers.41.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.903718367037072e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006911371601745486, "sensitivity": 0.580349963398253 }, { "name": "model.layers.41.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.2554593215318164e-06, "sensitivity": 2.0660453725384755 }, { "name": "model.layers.41.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.142121504926763e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006270328303799033, "sensitivity": 0.5964012976267243 }, { "name": "model.layers.41.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.412077345885336e-05, "sensitivity": 0.7659197357327157 }, { "name": "model.layers.41.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.99056146863586e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.307669536909088e-05, "sensitivity": 0.635609956075893 }, { "name": "model.layers.41.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007079103961586952, "sensitivity": 0.580946567914994 }, { "name": "model.layers.41.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.63215837196185e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007227996829897165, "sensitivity": 0.5682448005563207 }, { "name": "model.layers.41.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.135553121566772e-05, "sensitivity": 0.6469623592317784 }, { "name": "model.layers.41.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.962138172639243e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007010043482296169, "sensitivity": 0.5273443730831106 }, { "name": "model.layers.41.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.261763337533921e-05, "sensitivity": 0.7503401429020842 }, { "name": "model.layers.41.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.994830528128659e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007137047359719872, "sensitivity": 0.5336408190456772 }, { "name": "model.layers.41.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7454322814010084e-05, "sensitivity": 0.6723554856876358 }, { "name": "model.layers.41.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.52287212687952e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000642994767986238, "sensitivity": 0.5107356692791247 }, { "name": "model.layers.41.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6050772400340065e-05, "sensitivity": 0.8837375497344869 }, { "name": "model.layers.41.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.552788924338529e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006891568191349506, "sensitivity": 0.5985433022683476 }, { "name": "model.layers.41.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1305367479508277e-05, "sensitivity": 1.2538808216875104 }, { "name": "model.layers.41.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1955032732657855e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006709459121339023, "sensitivity": 0.576176287293854 }, { "name": "model.layers.41.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.217109638673719e-05, "sensitivity": 1.2768486252227693 }, { "name": "model.layers.41.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.26046607724129e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007208720780909061, "sensitivity": 0.5077073710766574 }, { "name": "model.layers.41.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006913035176694393, "sensitivity": 0.5140819427416049 }, { "name": "model.layers.41.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.046321227084263e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006614301237277687, "sensitivity": 0.538192485331879 }, { "name": "model.layers.41.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.72855312586762e-05, "sensitivity": 0.7240514665270148 }, { "name": "model.layers.41.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.198171255775378e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007643825374543667, "sensitivity": 0.5463410404973734 }, { "name": "model.layers.41.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8245128457201645e-05, "sensitivity": 0.6328891291984046 }, { "name": "model.layers.41.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.560971428370976e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006481005111709237, "sensitivity": 0.5617556652009931 }, { "name": "model.layers.41.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.039664731360972e-05, "sensitivity": 0.7829448572995998 }, { "name": "model.layers.41.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.102524932633969e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006459177238866687, "sensitivity": 0.5251627198030586 }, { "name": "model.layers.41.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007044441881589592, "sensitivity": 0.5917143537571611 }, { "name": "model.layers.41.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.23705704533495e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000664009596221149, "sensitivity": 0.5249463023283387 }, { "name": "model.layers.41.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006909488001838326, "sensitivity": 0.5589949901260985 }, { "name": "model.layers.41.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.304964810828096e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006838515400886536, "sensitivity": 0.5198717568074016 }, { "name": "model.layers.41.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.7221430324716493e-05, "sensitivity": 0.664424028633191 }, { "name": "model.layers.41.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.780475700907118e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006915663834661245, "sensitivity": 0.5656743861791561 }, { "name": "model.layers.41.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.591388228116557e-05, "sensitivity": 0.6928039057835625 }, { "name": "model.layers.41.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.569071496822289e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007154032355174422, "sensitivity": 0.5810094878772014 }, { "name": "model.layers.41.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.478707655332983e-05, "sensitivity": 0.6569476283161445 }, { "name": "model.layers.41.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.350872692768462e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007135821506381035, "sensitivity": 0.5381796655413766 }, { "name": "model.layers.41.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.954498192295432e-05, "sensitivity": 0.6172877902238089 }, { "name": "model.layers.41.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.66999505685817e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006395004456862807, "sensitivity": 0.539054976939576 }, { "name": "model.layers.41.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.361599662341177e-05, "sensitivity": 1.0755950337738462 }, { "name": "model.layers.41.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.7849487221610616e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.060549276298843e-05, "sensitivity": 0.6828571506531207 }, { "name": "model.layers.41.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0684698837576434e-05, "sensitivity": 0.7683430818284114 }, { "name": "model.layers.41.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.663024916837458e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.22274455963634e-05, "sensitivity": 0.6007335473080094 }, { "name": "model.layers.41.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.13320547825424e-05, "sensitivity": 1.959106246380401 }, { "name": "model.layers.41.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5235598311846843e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.874672206118703e-05, "sensitivity": 0.7587259537372282 }, { "name": "model.layers.41.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.6269516790052876e-05, "sensitivity": 0.7978794170571842 }, { "name": "model.layers.41.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0523762057346175e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00063088140450418, "sensitivity": 0.5687902267250491 }, { "name": "model.layers.41.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.26073160674423e-05, "sensitivity": 0.9419534160888454 }, { "name": "model.layers.41.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.457751394213119e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007397853769361973, "sensitivity": 0.5399738374944919 }, { "name": "model.layers.41.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.518992449855432e-05, "sensitivity": 0.7480016361348932 }, { "name": "model.layers.41.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.433432299170818e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.44297688268125e-05, "sensitivity": 0.6198039728546172 }, { "name": "model.layers.41.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.26630790065974e-05, "sensitivity": 0.9781163455208365 }, { "name": "model.layers.41.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.155002089755726e-07, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006989313988015056, "sensitivity": 0.5702501135014564 }, { "name": "model.layers.41.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.6158246580744162e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.823588602041127e-06, "sensitivity": 2.1046306987645313 }, { "name": "model.layers.41.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.070756858709501e-06, "sensitivity": 10.0 }, { "name": "model.layers.41.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.6009091723390156e-06, "sensitivity": 2.105183120959502 }, { "name": "model.layers.41.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 1.136887749453308e-05, "sensitivity": 2.2299636904771125 }, { "name": "model.layers.41.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00016693651559762657, "sensitivity": 0.7437160278456537 }, { "name": "model.layers.41.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.937441629706882e-05, "sensitivity": 0.8174296001364302 }, { "name": "model.layers.41.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 4.936152254231274e-05, "sensitivity": 0.8506519673861413 }, { "name": "model.layers.41.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00021875753009226173, "sensitivity": 0.7663255807388758 }, { "name": "model.layers.42.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.841529855388217e-05, "sensitivity": 0.7957119149922822 }, { "name": "model.layers.42.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.555017186357873e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.7836685300571844e-05, "sensitivity": 0.7802066550944822 }, { "name": "model.layers.42.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0857602319447324e-05, "sensitivity": 1.3231470746963065 }, { "name": "model.layers.42.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1364725196472136e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006856260588392615, "sensitivity": 0.5900897995729383 }, { "name": "model.layers.42.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.515988206956536e-05, "sensitivity": 0.7260876352241864 }, { "name": "model.layers.42.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.886656021582894e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007187202572822571, "sensitivity": 0.5528980650929015 }, { "name": "model.layers.42.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007666065357625484, "sensitivity": 0.528838097454211 }, { "name": "model.layers.42.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.216026460810099e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007471974822692573, "sensitivity": 0.5441465076639755 }, { "name": "model.layers.42.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007185963913798332, "sensitivity": 0.5881133615464419 }, { "name": "model.layers.42.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.703962066647364e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006633991142734885, "sensitivity": 0.5642161365858734 }, { "name": "model.layers.42.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.29062342341058e-05, "sensitivity": 0.8787289554209534 }, { "name": "model.layers.42.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.932016382663278e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006909994408488274, "sensitivity": 0.5659151947853597 }, { "name": "model.layers.42.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.227577978279442e-05, "sensitivity": 0.7354239753439784 }, { "name": "model.layers.42.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.309768529419671e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006665278924629092, "sensitivity": 0.5279137781564828 }, { "name": "model.layers.42.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000695937080308795, "sensitivity": 0.5855078362591475 }, { "name": "model.layers.42.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.517912194998644e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006879447028040886, "sensitivity": 0.5472404529116469 }, { "name": "model.layers.42.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.414746167138219e-05, "sensitivity": 0.7043633264119538 }, { "name": "model.layers.42.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.343247029391932e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000697073875926435, "sensitivity": 0.5283186240394318 }, { "name": "model.layers.42.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.477203714894131e-05, "sensitivity": 1.018397678928106 }, { "name": "model.layers.42.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 3.3711173728079302e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.004391980241053e-05, "sensitivity": 0.6946895831136989 }, { "name": "model.layers.42.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.662727926392108e-05, "sensitivity": 0.8394184996414573 }, { "name": "model.layers.42.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.251550530578243e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.905995931243524e-05, "sensitivity": 0.9166191446612414 }, { "name": "model.layers.42.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.421824946301058e-05, "sensitivity": 0.7456914367254829 }, { "name": "model.layers.42.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.834805953483738e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0432001191657037e-05, "sensitivity": 0.6555380290921038 }, { "name": "model.layers.42.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.257584027480334e-05, "sensitivity": 0.6107202071242017 }, { "name": "model.layers.42.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.339013106706261e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006481194868683815, "sensitivity": 0.5281825312463373 }, { "name": "model.layers.42.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.959944585105404e-05, "sensitivity": 0.6704017326974941 }, { "name": "model.layers.42.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.895680482761236e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.001499034231529e-05, "sensitivity": 0.6582125270723204 }, { "name": "model.layers.42.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.36108306935057e-05, "sensitivity": 0.9112478715317222 }, { "name": "model.layers.42.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.492514436715282e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007152113830670714, "sensitivity": 0.548880267424116 }, { "name": "model.layers.42.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.6466185671743e-05, "sensitivity": 0.9620782011697538 }, { "name": "model.layers.42.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2219447853567544e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007017725147306919, "sensitivity": 0.5701031565689625 }, { "name": "model.layers.42.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0786619895952754e-05, "sensitivity": 1.6370386748362917 }, { "name": "model.layers.42.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.470371426483325e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.329223106149584e-05, "sensitivity": 0.8766514063870581 }, { "name": "model.layers.42.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.0390433999418747e-05, "sensitivity": 1.8971330840274092 }, { "name": "model.layers.42.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.385707251865824e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000717572052963078, "sensitivity": 0.524005473573515 }, { "name": "model.layers.42.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000722483906429261, "sensitivity": 0.5358038064562543 }, { "name": "model.layers.42.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.17668592389964e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007184402784332633, "sensitivity": 0.5431193168381769 }, { "name": "model.layers.42.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.912224150961265e-05, "sensitivity": 0.8943963056026272 }, { "name": "model.layers.42.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1317815733491443e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.064596527721733e-05, "sensitivity": 0.7890594121277295 }, { "name": "model.layers.42.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.321022374322638e-05, "sensitivity": 0.791861954959914 }, { "name": "model.layers.42.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.61006469676795e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006844158633612096, "sensitivity": 0.5198531686652696 }, { "name": "model.layers.42.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.351924093905836e-05, "sensitivity": 0.7490292203066264 }, { "name": "model.layers.42.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.64012180903228e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.877725197933614e-05, "sensitivity": 0.6816939039419588 }, { "name": "model.layers.42.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006681570084765553, "sensitivity": 0.5636357173950649 }, { "name": "model.layers.42.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.415692605012737e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006219518836587667, "sensitivity": 0.5466696186482577 }, { "name": "model.layers.42.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.152949936222285e-05, "sensitivity": 0.8327871896078628 }, { "name": "model.layers.42.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.41454379951756e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006963221239857376, "sensitivity": 0.5191804995441407 }, { "name": "model.layers.42.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007689629564993083, "sensitivity": 0.5384276379838014 }, { "name": "model.layers.42.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.824048111615411e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.017911411821842e-05, "sensitivity": 0.6959803595228109 }, { "name": "model.layers.42.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006938354927115142, "sensitivity": 0.5403219622669397 }, { "name": "model.layers.42.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.55552150621952e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.961046554148197e-05, "sensitivity": 0.6019468899995257 }, { "name": "model.layers.42.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.305998977040872e-05, "sensitivity": 0.7273146669004641 }, { "name": "model.layers.42.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.22104788969591e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.33803938399069e-05, "sensitivity": 0.7113421617490936 }, { "name": "model.layers.42.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007721766596660018, "sensitivity": 0.5969072642026748 }, { "name": "model.layers.42.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.15213411442528e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00076205690857023, "sensitivity": 0.5359761694038155 }, { "name": "model.layers.42.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.164881051518023e-05, "sensitivity": 0.6638906004262348 }, { "name": "model.layers.42.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.972930688993074e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006960458122193813, "sensitivity": 0.5242914073032128 }, { "name": "model.layers.42.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006955303251743317, "sensitivity": 0.5436855737811525 }, { "name": "model.layers.42.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.134125326047069e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006508738733828068, "sensitivity": 0.5575961127733322 }, { "name": "model.layers.42.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007137075299397111, "sensitivity": 0.547972069363834 }, { "name": "model.layers.42.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.795737815285975e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000734523287974298, "sensitivity": 0.5627470176692915 }, { "name": "model.layers.42.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.823950777994469e-05, "sensitivity": 0.8258675677818186 }, { "name": "model.layers.42.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.826755563655752e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006011682562530041, "sensitivity": 0.5549504582609434 }, { "name": "model.layers.42.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.605713133467361e-05, "sensitivity": 0.7247001641381936 }, { "name": "model.layers.42.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.078006317191466e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007018343894742429, "sensitivity": 0.5425029258117264 }, { "name": "model.layers.42.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.037659113644622e-05, "sensitivity": 0.6013140849024605 }, { "name": "model.layers.42.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.684772521723062e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006402776343747973, "sensitivity": 0.5639058525594804 }, { "name": "model.layers.42.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.265392585191876e-05, "sensitivity": 0.69808798491704 }, { "name": "model.layers.42.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.525641419510066e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006855819374322891, "sensitivity": 0.5636779892336032 }, { "name": "model.layers.42.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.000485154800117e-05, "sensitivity": 0.8315855166128107 }, { "name": "model.layers.42.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.46968079409271e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.875012720935047e-05, "sensitivity": 0.7898663136928536 }, { "name": "model.layers.42.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.211718573467806e-05, "sensitivity": 0.9524992934922878 }, { "name": "model.layers.42.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.573803501742077e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.97207433404401e-05, "sensitivity": 0.7449550418513916 }, { "name": "model.layers.42.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007294550305232406, "sensitivity": 0.5863101894099255 }, { "name": "model.layers.42.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.512640192748222e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.1832709787995555e-05, "sensitivity": 1.2076650356964242 }, { "name": "model.layers.42.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.461658631451428e-05, "sensitivity": 0.8718683314746938 }, { "name": "model.layers.42.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.115264694817597e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.653965101577342e-05, "sensitivity": 0.7542416297560929 }, { "name": "model.layers.42.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006800342234782875, "sensitivity": 0.5562639367676248 }, { "name": "model.layers.42.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.51461777529039e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006344640860334039, "sensitivity": 0.5823763621259959 }, { "name": "model.layers.42.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.914940604474396e-05, "sensitivity": 0.6028626362736123 }, { "name": "model.layers.42.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.888129402999766e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00078191002830863, "sensitivity": 0.5469874649809215 }, { "name": "model.layers.42.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.935208173468709e-05, "sensitivity": 0.9576644442246535 }, { "name": "model.layers.42.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.246539214771474e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.67234746995382e-05, "sensitivity": 0.8384764383667201 }, { "name": "model.layers.42.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.27351037110202e-05, "sensitivity": 0.7415633994582423 }, { "name": "model.layers.42.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.747560625328333e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006950628012418747, "sensitivity": 0.5781572522599896 }, { "name": "model.layers.42.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.437484989874065e-05, "sensitivity": 1.0622152745182751 }, { "name": "model.layers.42.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.007466132970876e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000747651734855026, "sensitivity": 0.5723989061936089 }, { "name": "model.layers.42.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0876183852087706e-05, "sensitivity": 1.0757531109824379 }, { "name": "model.layers.42.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.392846456838015e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006803018040955067, "sensitivity": 0.5555293420253357 }, { "name": "model.layers.42.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.892054468858987e-05, "sensitivity": 0.6553367277566738 }, { "name": "model.layers.42.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.074842756082944e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006392718642018735, "sensitivity": 0.555718772971481 }, { "name": "model.layers.42.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007037587347440422, "sensitivity": 0.5508363463536361 }, { "name": "model.layers.42.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.800029268561048e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.00070993322879076, "sensitivity": 0.5593918525934858 }, { "name": "model.layers.42.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.81035201321356e-05, "sensitivity": 0.7469523656929645 }, { "name": "model.layers.42.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.845213758628233e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.007660340401344e-05, "sensitivity": 0.6041161713793266 }, { "name": "model.layers.42.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.583704089280218e-05, "sensitivity": 0.618624454217352 }, { "name": "model.layers.42.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.799437066249084e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007455744780600071, "sensitivity": 0.5349158236653042 }, { "name": "model.layers.42.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006808197940699756, "sensitivity": 0.5590007216263808 }, { "name": "model.layers.42.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.248711083069793e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006570323603227735, "sensitivity": 0.540613283934085 }, { "name": "model.layers.42.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.975081512588076e-05, "sensitivity": 0.8079915376673483 }, { "name": "model.layers.42.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.318592108480516e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006532830884680152, "sensitivity": 0.5334090483291635 }, { "name": "model.layers.42.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.505313674802892e-05, "sensitivity": 0.9799445703558334 }, { "name": "model.layers.42.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.309932132353424e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006458432762883604, "sensitivity": 0.580839833936684 }, { "name": "model.layers.42.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.878613592358306e-05, "sensitivity": 0.7419170973464261 }, { "name": "model.layers.42.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.115983748917643e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006737703224644065, "sensitivity": 0.5604943083925737 }, { "name": "model.layers.42.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.76925337756984e-05, "sensitivity": 0.8186792980416899 }, { "name": "model.layers.42.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.989331945485901e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.710251909680665e-05, "sensitivity": 0.6302750791354621 }, { "name": "model.layers.42.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006861516740173101, "sensitivity": 0.5381081705944548 }, { "name": "model.layers.42.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.46274202154018e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006747896550223231, "sensitivity": 0.528479439052234 }, { "name": "model.layers.42.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.633331602439284e-05, "sensitivity": 0.8561472585214235 }, { "name": "model.layers.42.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0717322993514244e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.697547385352664e-05, "sensitivity": 0.6197759407107952 }, { "name": "model.layers.42.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.120010220911354e-05, "sensitivity": 0.6490091656429997 }, { "name": "model.layers.42.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.989336043261574e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006675642216578126, "sensitivity": 0.5446076036128218 }, { "name": "model.layers.42.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.913885590620339e-05, "sensitivity": 0.7692744737317054 }, { "name": "model.layers.42.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0495098194951424e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008000998641364276, "sensitivity": 0.5463566442848038 }, { "name": "model.layers.42.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.140126788523048e-05, "sensitivity": 0.7101571550729641 }, { "name": "model.layers.42.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1133117823192151e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006962978513911366, "sensitivity": 0.5464407792875435 }, { "name": "model.layers.42.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006499738665297627, "sensitivity": 0.538278870914285 }, { "name": "model.layers.42.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.978722240091884e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006463453755713999, "sensitivity": 0.5414925734759536 }, { "name": "model.layers.42.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006826870958320796, "sensitivity": 0.5134715668987958 }, { "name": "model.layers.42.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.437837439283612e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006878517451696098, "sensitivity": 0.5251434920696814 }, { "name": "model.layers.42.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.399252015398815e-05, "sensitivity": 0.6742922180024105 }, { "name": "model.layers.42.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.152152647904586e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.04131564614363e-05, "sensitivity": 0.6052462072394693 }, { "name": "model.layers.42.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000702015298884362, "sensitivity": 0.5505028175948089 }, { "name": "model.layers.42.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.06265313460608e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.241867959033698e-05, "sensitivity": 0.6591178680131635 }, { "name": "model.layers.42.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007171110482886434, "sensitivity": 0.5435028697729273 }, { "name": "model.layers.42.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.384289114677813e-07, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.256959022721276e-05, "sensitivity": 0.60003609787317 }, { "name": "model.layers.42.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.5517931615249836e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.920926933962619e-06, "sensitivity": 2.106015007032067 }, { "name": "model.layers.42.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.417030140757561e-06, "sensitivity": 10.0 }, { "name": "model.layers.42.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.9301337488286663e-06, "sensitivity": 2.1098198081230874 }, { "name": "model.layers.42.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 1.132014313043328e-05, "sensitivity": 2.2457080895309347 }, { "name": "model.layers.42.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.0002176280686398968, "sensitivity": 0.793304873611195 }, { "name": "model.layers.42.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.952105048985686e-05, "sensitivity": 0.8953795962904546 }, { "name": "model.layers.42.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 4.385049032862298e-05, "sensitivity": 0.7625087755739327 }, { "name": "model.layers.42.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 4, "mse": 5.0670485506998375e-05, "sensitivity": 1.3972905042165102 }, { "name": "model.layers.43.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007602049736306071, "sensitivity": 0.5464695601897201 }, { "name": "model.layers.43.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.337433428096119e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007353726541623473, "sensitivity": 0.5030598040757807 }, { "name": "model.layers.43.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.06094254180789e-05, "sensitivity": 0.7536802149272124 }, { "name": "model.layers.43.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.38350706797064e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006896990234963596, "sensitivity": 0.5193550616101942 }, { "name": "model.layers.43.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007068581762723625, "sensitivity": 0.5602133947865361 }, { "name": "model.layers.43.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.9241302703158e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000701389042660594, "sensitivity": 0.5321533061889326 }, { "name": "model.layers.43.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.807704630773515e-05, "sensitivity": 0.7223615614118086 }, { "name": "model.layers.43.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.157438742273371e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007702443981543183, "sensitivity": 0.5676283462769451 }, { "name": "model.layers.43.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007090584840625525, "sensitivity": 0.5413746051935067 }, { "name": "model.layers.43.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.687174274906283e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.915791552979499e-05, "sensitivity": 0.6041257305783041 }, { "name": "model.layers.43.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.254221079871058e-05, "sensitivity": 1.0066315656993803 }, { "name": "model.layers.43.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.186231070794747e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006527038640342653, "sensitivity": 0.5475471419099096 }, { "name": "model.layers.43.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007160776294767857, "sensitivity": 0.5363701662060172 }, { "name": "model.layers.43.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.08540812361025e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007149602752178907, "sensitivity": 0.5257473111849387 }, { "name": "model.layers.43.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.467907223850489e-05, "sensitivity": 0.8963638060860218 }, { "name": "model.layers.43.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1171466667292407e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006646484835073352, "sensitivity": 0.5481306627950793 }, { "name": "model.layers.43.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.538357411045581e-05, "sensitivity": 0.6059388669614247 }, { "name": "model.layers.43.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.766763587824244e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007532999152317643, "sensitivity": 0.5926591539709923 }, { "name": "model.layers.43.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.741487595718354e-05, "sensitivity": 0.6257929823890587 }, { "name": "model.layers.43.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.533026516488462e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007453775033354759, "sensitivity": 0.5379135006676337 }, { "name": "model.layers.43.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.10342831350863e-05, "sensitivity": 0.6558643182353636 }, { "name": "model.layers.43.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1285287655482534e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.17396435700357e-05, "sensitivity": 0.6386070806799791 }, { "name": "model.layers.43.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.862269947305322e-05, "sensitivity": 0.9213451491653574 }, { "name": "model.layers.43.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.445901246683206e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007488647825084627, "sensitivity": 0.5537965448976867 }, { "name": "model.layers.43.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.161590863484889e-05, "sensitivity": 0.9972387017984927 }, { "name": "model.layers.43.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.472339002059016e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006629893905483186, "sensitivity": 0.5376378700670619 }, { "name": "model.layers.43.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007105680997483432, "sensitivity": 0.5653131069497036 }, { "name": "model.layers.43.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.97127427176747e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007281664293259382, "sensitivity": 0.550759062377212 }, { "name": "model.layers.43.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006981519982218742, "sensitivity": 0.5604057494663626 }, { "name": "model.layers.43.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.401133868574107e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006430709036067128, "sensitivity": 0.5242284841051603 }, { "name": "model.layers.43.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1568177797016688e-05, "sensitivity": 1.368843722965875 }, { "name": "model.layers.43.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0594793593554641e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.30366412224248e-05, "sensitivity": 0.8832817933457103 }, { "name": "model.layers.43.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007135483319871128, "sensitivity": 0.5793563839924372 }, { "name": "model.layers.43.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5430555322382133e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.6403452617814764e-05, "sensitivity": 0.6305334829982305 }, { "name": "model.layers.43.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.449005741160363e-05, "sensitivity": 0.7602857496220393 }, { "name": "model.layers.43.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.3833094928704668e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.8849436754826456e-05, "sensitivity": 0.6839798995671371 }, { "name": "model.layers.43.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007157976506277919, "sensitivity": 0.5644498181291174 }, { "name": "model.layers.43.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.924401757009036e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007478293846361339, "sensitivity": 0.5141644954489499 }, { "name": "model.layers.43.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.356634548865259e-05, "sensitivity": 1.0135940340382508 }, { "name": "model.layers.43.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.50205992719566e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.630555435549468e-05, "sensitivity": 1.0000241133330823 }, { "name": "model.layers.43.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007199060055427253, "sensitivity": 0.5133961017423346 }, { "name": "model.layers.43.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.769479909962683e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007056538015604019, "sensitivity": 0.5156803968734944 }, { "name": "model.layers.43.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.446917541325092e-05, "sensitivity": 0.6237774514059087 }, { "name": "model.layers.43.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.29873897600919e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007185357389971614, "sensitivity": 0.55331479741186 }, { "name": "model.layers.43.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007423778297379613, "sensitivity": 0.5525429887297905 }, { "name": "model.layers.43.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.333818186656572e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.267482240218669e-05, "sensitivity": 0.6626891424340376 }, { "name": "model.layers.43.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.289585144259036e-05, "sensitivity": 0.8619085733716331 }, { "name": "model.layers.43.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0510084393899888e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007167309522628784, "sensitivity": 0.5487098095314373 }, { "name": "model.layers.43.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007487088441848755, "sensitivity": 0.5273298041748221 }, { "name": "model.layers.43.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.974442380349501e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007033213041722775, "sensitivity": 0.56133777505148 }, { "name": "model.layers.43.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.918281724210829e-05, "sensitivity": 0.9371596289247276 }, { "name": "model.layers.43.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.176014827971812e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007960271905176342, "sensitivity": 0.5845027696843041 }, { "name": "model.layers.43.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.557175220223144e-05, "sensitivity": 0.977231869711168 }, { "name": "model.layers.43.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0550286333455006e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007197223603725433, "sensitivity": 0.5806954006599391 }, { "name": "model.layers.43.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.395734817488119e-05, "sensitivity": 0.6771258165153251 }, { "name": "model.layers.43.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.752344342610741e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007044849917292595, "sensitivity": 0.5337903101258101 }, { "name": "model.layers.43.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.672403105767444e-05, "sensitivity": 0.6863695297004222 }, { "name": "model.layers.43.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.103785719664302e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007481633219867945, "sensitivity": 0.5669404839287818 }, { "name": "model.layers.43.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.53538154438138e-05, "sensitivity": 0.8721769667000383 }, { "name": "model.layers.43.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.656571364757838e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007436113664880395, "sensitivity": 0.5354187274845696 }, { "name": "model.layers.43.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1031595022359397e-05, "sensitivity": 1.2329938096450408 }, { "name": "model.layers.43.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2726829936582362e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5851705837994814e-05, "sensitivity": 0.9368064274905104 }, { "name": "model.layers.43.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.8756872022058815e-05, "sensitivity": 0.760092770990358 }, { "name": "model.layers.43.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.380410238511104e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006733516929671168, "sensitivity": 0.5587930697067868 }, { "name": "model.layers.43.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.370192568283528e-05, "sensitivity": 0.665298239345866 }, { "name": "model.layers.43.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.083666441256355e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006640083156526089, "sensitivity": 0.5822587982449973 }, { "name": "model.layers.43.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.089695307309739e-05, "sensitivity": 0.7528875012174574 }, { "name": "model.layers.43.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.079621238721302e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006406238535419106, "sensitivity": 0.5239892271278668 }, { "name": "model.layers.43.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007680892013013363, "sensitivity": 0.5543853898771702 }, { "name": "model.layers.43.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.038042551561375e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007518132915720344, "sensitivity": 0.5432214482838585 }, { "name": "model.layers.43.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.898112431168556e-05, "sensitivity": 0.6077859135103809 }, { "name": "model.layers.43.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.517292033298872e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006474503315985203, "sensitivity": 0.542046016694562 }, { "name": "model.layers.43.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.130761903477833e-05, "sensitivity": 0.6749887462028362 }, { "name": "model.layers.43.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.376518169621704e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006975022843107581, "sensitivity": 0.5608508737946268 }, { "name": "model.layers.43.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.67184212943539e-05, "sensitivity": 0.9606530548764715 }, { "name": "model.layers.43.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0551210607445682e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.722871330566704e-05, "sensitivity": 0.6360530259105807 }, { "name": "model.layers.43.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.94753834977746e-05, "sensitivity": 0.6452400470852713 }, { "name": "model.layers.43.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.9766118687985e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007584846462123096, "sensitivity": 0.5780167030969342 }, { "name": "model.layers.43.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.949484693701379e-05, "sensitivity": 0.614501102444877 }, { "name": "model.layers.43.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1742238257284043e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.190763087943196e-05, "sensitivity": 0.7541452833791258 }, { "name": "model.layers.43.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.644753739237785e-05, "sensitivity": 0.7484106990285906 }, { "name": "model.layers.43.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.796037829801207e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007211086340248585, "sensitivity": 0.5492890827850987 }, { "name": "model.layers.43.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.0088332247687504e-05, "sensitivity": 0.8724219081115563 }, { "name": "model.layers.43.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.704984798489022e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.9934693126706406e-05, "sensitivity": 0.6958862903906574 }, { "name": "model.layers.43.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.563553324667737e-05, "sensitivity": 0.666849751617395 }, { "name": "model.layers.43.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4452897403316456e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007203572895377874, "sensitivity": 0.5886464198280477 }, { "name": "model.layers.43.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007292439695447683, "sensitivity": 0.5598409669710303 }, { "name": "model.layers.43.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.565109854112961e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006779240211471915, "sensitivity": 0.5586268013533522 }, { "name": "model.layers.43.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.347454473143443e-05, "sensitivity": 0.677598079556423 }, { "name": "model.layers.43.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.626396604289766e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.47109845886007e-05, "sensitivity": 0.8458524243818664 }, { "name": "model.layers.43.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006744525162503123, "sensitivity": 0.5378248049130053 }, { "name": "model.layers.43.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.473017262782378e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006802569841966033, "sensitivity": 0.54822643097021 }, { "name": "model.layers.43.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.900752148590982e-05, "sensitivity": 0.8534019043796697 }, { "name": "model.layers.43.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.323776571865892e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006593801081180573, "sensitivity": 0.5697479580638655 }, { "name": "model.layers.43.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.608199328184128e-05, "sensitivity": 0.6235961677281738 }, { "name": "model.layers.43.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.617358844276168e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000712305773049593, "sensitivity": 0.5749446144309999 }, { "name": "model.layers.43.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007140818051993847, "sensitivity": 0.5451863119884042 }, { "name": "model.layers.43.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.106591735668189e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006562676280736923, "sensitivity": 0.5290953336154 }, { "name": "model.layers.43.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006725781131535769, "sensitivity": 0.5294181122957213 }, { "name": "model.layers.43.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.401941269970848e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006057674763724208, "sensitivity": 0.5383045994928395 }, { "name": "model.layers.43.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007404013886116445, "sensitivity": 0.573422582499427 }, { "name": "model.layers.43.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.434894536752836e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006949108792468905, "sensitivity": 0.5230779957151239 }, { "name": "model.layers.43.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007323437603190541, "sensitivity": 0.555107056432431 }, { "name": "model.layers.43.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.726052331236133e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006916522397659719, "sensitivity": 0.5310334142519224 }, { "name": "model.layers.43.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.631897849729285e-05, "sensitivity": 0.8954178522868191 }, { "name": "model.layers.43.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.006475920614321e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.788840983062983e-05, "sensitivity": 0.6576159871176783 }, { "name": "model.layers.43.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.4978074331302196e-05, "sensitivity": 0.7324365225999765 }, { "name": "model.layers.43.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.090043479569431e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.5197328038048e-05, "sensitivity": 0.7332859313985554 }, { "name": "model.layers.43.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000706388265825808, "sensitivity": 0.5852038501196448 }, { "name": "model.layers.43.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.316391474887496e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000722581404261291, "sensitivity": 0.5585825295713616 }, { "name": "model.layers.43.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.362442945828661e-05, "sensitivity": 0.7305398921976136 }, { "name": "model.layers.43.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 6.733836812600202e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006913202814757824, "sensitivity": 0.5271714962386383 }, { "name": "model.layers.43.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.350209878291935e-05, "sensitivity": 0.87788511650309 }, { "name": "model.layers.43.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.174170847662026e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006966536748223007, "sensitivity": 0.5218709503987016 }, { "name": "model.layers.43.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000765431672334671, "sensitivity": 0.5334983724962531 }, { "name": "model.layers.43.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.464427653758321e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007559815421700478, "sensitivity": 0.5192682092150792 }, { "name": "model.layers.43.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.75679839332588e-05, "sensitivity": 0.7006577170516504 }, { "name": "model.layers.43.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.118143018175033e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.555086292792112e-05, "sensitivity": 0.6240497560298713 }, { "name": "model.layers.43.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006942005711607635, "sensitivity": 0.5420111151428778 }, { "name": "model.layers.43.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.888038453529589e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006458614952862263, "sensitivity": 0.5297045682315391 }, { "name": "model.layers.43.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.3777238311595283e-06, "sensitivity": 2.097584030602833 }, { "name": "model.layers.43.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.569267831466277e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006334905629046261, "sensitivity": 0.563786487693265 }, { "name": "model.layers.43.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.464107718784362e-05, "sensitivity": 0.638451447858533 }, { "name": "model.layers.43.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.205649351111788e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.2693803000729531e-05, "sensitivity": 1.6068223093561085 }, { "name": "model.layers.43.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 5.739050538977608e-05, "sensitivity": 0.7349403502664091 }, { "name": "model.layers.43.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.775734497452504e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.775667887064628e-05, "sensitivity": 0.7023051144554664 }, { "name": "model.layers.43.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000741225085221231, "sensitivity": 0.556129578364327 }, { "name": "model.layers.43.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.10547612420487e-07, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007108502904884517, "sensitivity": 0.5593631462931187 }, { "name": "model.layers.43.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.506847752352769e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.968503738680738e-06, "sensitivity": 2.106978125585001 }, { "name": "model.layers.43.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.185621037322562e-06, "sensitivity": 10.0 }, { "name": "model.layers.43.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.6698617173460661e-06, "sensitivity": 2.1092339103152766 }, { "name": "model.layers.43.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 1.0488554835319519e-05, "sensitivity": 2.202904940453286 }, { "name": "model.layers.43.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00016809572116471827, "sensitivity": 0.8038724217385219 }, { "name": "model.layers.43.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.555923154228367e-05, "sensitivity": 0.9683457971495986 }, { "name": "model.layers.43.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 5.392429739004001e-05, "sensitivity": 0.668693971450738 }, { "name": "model.layers.43.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00025356863625347614, "sensitivity": 1.009493891432195 }, { "name": "model.layers.44.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.721816316712648e-05, "sensitivity": 0.6505045782807755 }, { "name": "model.layers.44.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1029678717022762e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007438661414198577, "sensitivity": 0.5528240209637193 }, { "name": "model.layers.44.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007144473493099213, "sensitivity": 0.5701729083047802 }, { "name": "model.layers.44.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.028917702380568e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006599724292755127, "sensitivity": 0.5508535517750209 }, { "name": "model.layers.44.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.275554187595844e-05, "sensitivity": 0.7965469779046492 }, { "name": "model.layers.44.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2340412922640098e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006909950170665979, "sensitivity": 0.5429912236380408 }, { "name": "model.layers.44.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.396927346941084e-05, "sensitivity": 0.8464221986356608 }, { "name": "model.layers.44.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0305855084880022e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.227615813259035e-05, "sensitivity": 0.6994166848156405 }, { "name": "model.layers.44.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.244799053296447e-05, "sensitivity": 0.6328697845871003 }, { "name": "model.layers.44.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0389820772616076e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007791281677782536, "sensitivity": 0.5419851668230082 }, { "name": "model.layers.44.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.718221993651241e-05, "sensitivity": 0.6893933567250712 }, { "name": "model.layers.44.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.825123490561964e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.26677501713857e-05, "sensitivity": 0.6942670243191869 }, { "name": "model.layers.44.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.690894952043891e-05, "sensitivity": 0.6421432807357237 }, { "name": "model.layers.44.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.83415930022602e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.585029041161761e-05, "sensitivity": 0.7138820151704328 }, { "name": "model.layers.44.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.131193367764354e-05, "sensitivity": 0.8956350050427091 }, { "name": "model.layers.44.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.938841690702247e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.374392978614196e-05, "sensitivity": 0.7058329270962431 }, { "name": "model.layers.44.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.62103047943674e-05, "sensitivity": 0.6780547557006654 }, { "name": "model.layers.44.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0438496929054963e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007035140879452229, "sensitivity": 0.545724195044324 }, { "name": "model.layers.44.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.296667172340676e-05, "sensitivity": 0.6396863835826716 }, { "name": "model.layers.44.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3356568615563447e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.750059012323618e-05, "sensitivity": 0.7308081306298588 }, { "name": "model.layers.44.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007417883607558906, "sensitivity": 0.5629377230059469 }, { "name": "model.layers.44.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.256982937382418e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007479933556169271, "sensitivity": 0.570133311496095 }, { "name": "model.layers.44.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.767684681108221e-05, "sensitivity": 0.8370400600689242 }, { "name": "model.layers.44.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.204756341001485e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007816435536369681, "sensitivity": 0.5120982723945207 }, { "name": "model.layers.44.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.736988143529743e-05, "sensitivity": 0.7336668493115764 }, { "name": "model.layers.44.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.598043450547266e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007070849533192813, "sensitivity": 0.5415163549213791 }, { "name": "model.layers.44.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000742375326808542, "sensitivity": 0.5500435236039959 }, { "name": "model.layers.44.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.237159019903629e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.0894131264649332e-05, "sensitivity": 1.2313641412289567 }, { "name": "model.layers.44.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007257721154019237, "sensitivity": 0.5585499546946778 }, { "name": "model.layers.44.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0495266451471252e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006369700422510505, "sensitivity": 0.5315488151272333 }, { "name": "model.layers.44.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.335852958727628e-05, "sensitivity": 0.9795409413602131 }, { "name": "model.layers.44.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.144749810729991e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.478999810293317e-05, "sensitivity": 0.6204275631611504 }, { "name": "model.layers.44.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007830878021195531, "sensitivity": 0.5738799422054301 }, { "name": "model.layers.44.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.848172339843586e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007468642434105277, "sensitivity": 0.5544485076594444 }, { "name": "model.layers.44.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.627313996432349e-05, "sensitivity": 0.644105959870115 }, { "name": "model.layers.44.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0271305654896423e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007289930945262313, "sensitivity": 0.5607562404609312 }, { "name": "model.layers.44.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007721954025328159, "sensitivity": 0.5515908613157806 }, { "name": "model.layers.44.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.196650694320851e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.806873716413975e-05, "sensitivity": 0.929522369090714 }, { "name": "model.layers.44.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007949993014335632, "sensitivity": 0.5275871646033481 }, { "name": "model.layers.44.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.124289590545231e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.654994649579749e-05, "sensitivity": 0.6430819425206679 }, { "name": "model.layers.44.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.59229772281833e-05, "sensitivity": 0.8316662776799173 }, { "name": "model.layers.44.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.386949505416851e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.39895151834935e-05, "sensitivity": 0.794329836304621 }, { "name": "model.layers.44.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.436893454520032e-05, "sensitivity": 0.6926282960702193 }, { "name": "model.layers.44.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.123044269974343e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.403076986316592e-05, "sensitivity": 0.7188266014676616 }, { "name": "model.layers.44.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.547794328071177e-05, "sensitivity": 0.8792033007484185 }, { "name": "model.layers.44.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.716622242995072e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.850815796293318e-05, "sensitivity": 0.7872208996920464 }, { "name": "model.layers.44.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000717272749170661, "sensitivity": 0.5382125644648024 }, { "name": "model.layers.44.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.935664368436846e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.846089334227145e-05, "sensitivity": 0.625244599403306 }, { "name": "model.layers.44.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007473204168491066, "sensitivity": 0.5239279682561628 }, { "name": "model.layers.44.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.998266250477172e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.158660835353658e-05, "sensitivity": 0.6388151685842007 }, { "name": "model.layers.44.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007195104262791574, "sensitivity": 0.5813269898479484 }, { "name": "model.layers.44.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.692317692293727e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.233198655536398e-05, "sensitivity": 0.6495061395144904 }, { "name": "model.layers.44.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007596053183078766, "sensitivity": 0.5453670883295056 }, { "name": "model.layers.44.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.818534524834831e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007286019972525537, "sensitivity": 0.5572768678515188 }, { "name": "model.layers.44.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008138448465615511, "sensitivity": 0.5679372511871077 }, { "name": "model.layers.44.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.475268143432913e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007643378339707851, "sensitivity": 0.5404592159465169 }, { "name": "model.layers.44.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.257896929018898e-05, "sensitivity": 1.219219530878525 }, { "name": "model.layers.44.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0628253903632867e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.543216295540333e-05, "sensitivity": 0.6299688014563213 }, { "name": "model.layers.44.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008144670864567161, "sensitivity": 0.5988046616131331 }, { "name": "model.layers.44.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2030363905068953e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007409557001665235, "sensitivity": 0.5538817924914536 }, { "name": "model.layers.44.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007529780268669128, "sensitivity": 0.5540609948291979 }, { "name": "model.layers.44.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0041035238828044e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006747780134901404, "sensitivity": 0.5362102247348453 }, { "name": "model.layers.44.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007039912743493915, "sensitivity": 0.5944380168765397 }, { "name": "model.layers.44.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0169318329644739e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006306021241471171, "sensitivity": 0.5685900808691268 }, { "name": "model.layers.44.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.590255361516029e-05, "sensitivity": 0.6908208112646494 }, { "name": "model.layers.44.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2492989753809525e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006820781854912639, "sensitivity": 0.5483611966661613 }, { "name": "model.layers.44.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.79271761327982e-05, "sensitivity": 0.7945173531893566 }, { "name": "model.layers.44.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.816491572360974e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007297940319404006, "sensitivity": 0.525159262570055 }, { "name": "model.layers.44.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007416746811941266, "sensitivity": 0.5236726085323328 }, { "name": "model.layers.44.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.264289246857516e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006893199752084911, "sensitivity": 0.5369244686755701 }, { "name": "model.layers.44.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.791971827624366e-05, "sensitivity": 0.620601214677712 }, { "name": "model.layers.44.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8975600823978311e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.996325853629969e-05, "sensitivity": 0.7122061538959272 }, { "name": "model.layers.44.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1525788977451157e-05, "sensitivity": 1.2216221990266511 }, { "name": "model.layers.44.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.102799367610714e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.466695049311966e-05, "sensitivity": 0.674915975999408 }, { "name": "model.layers.44.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007429630495607853, "sensitivity": 0.5398022010981032 }, { "name": "model.layers.44.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.316346793435514e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006879197317175567, "sensitivity": 0.5374090369337753 }, { "name": "model.layers.44.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008313389262184501, "sensitivity": 0.5472672984432546 }, { "name": "model.layers.44.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.031737135956064e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008202940225601196, "sensitivity": 0.570002736123001 }, { "name": "model.layers.44.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.603166548302397e-05, "sensitivity": 0.7076216491883703 }, { "name": "model.layers.44.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0680746527214069e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.698216020595282e-05, "sensitivity": 0.7603605918216456 }, { "name": "model.layers.44.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.696420314256102e-05, "sensitivity": 0.8281837761046184 }, { "name": "model.layers.44.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.500386456944398e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007019552285782993, "sensitivity": 0.5453882254926399 }, { "name": "model.layers.44.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.251256465679035e-05, "sensitivity": 1.1647941312434615 }, { "name": "model.layers.44.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0579399258858757e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.354296394623816e-05, "sensitivity": 0.7743960439881242 }, { "name": "model.layers.44.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007645798614248633, "sensitivity": 0.560114160855434 }, { "name": "model.layers.44.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.501494560026913e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007166076684370637, "sensitivity": 0.5613524237335158 }, { "name": "model.layers.44.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.249680154724047e-05, "sensitivity": 0.7720597356644348 }, { "name": "model.layers.44.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.280718131776666e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.34316893410869e-05, "sensitivity": 0.6911628631263855 }, { "name": "model.layers.44.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.266632746905088e-05, "sensitivity": 0.6300447885097535 }, { "name": "model.layers.44.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.653244887886103e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.816141442162916e-05, "sensitivity": 0.6540185411302251 }, { "name": "model.layers.44.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.343649874906987e-05, "sensitivity": 0.7140350396577568 }, { "name": "model.layers.44.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.245166327469633e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006859024288132787, "sensitivity": 0.5891826090574122 }, { "name": "model.layers.44.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007456468301825225, "sensitivity": 0.5791775445499563 }, { "name": "model.layers.44.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.04443970991997e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007078940980136395, "sensitivity": 0.542839422243419 }, { "name": "model.layers.44.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007623056881129742, "sensitivity": 0.5381048850190859 }, { "name": "model.layers.44.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0540120456425939e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.231208681128919e-05, "sensitivity": 0.6364689744329334 }, { "name": "model.layers.44.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007214054930955172, "sensitivity": 0.5311143484002249 }, { "name": "model.layers.44.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.663720905133232e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006334614008665085, "sensitivity": 0.5333600968004883 }, { "name": "model.layers.44.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000753675471059978, "sensitivity": 0.5961642569228527 }, { "name": "model.layers.44.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1277958265054622e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.528384983539581e-05, "sensitivity": 0.6755461818455213 }, { "name": "model.layers.44.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.45841971365735e-05, "sensitivity": 0.6608783117646649 }, { "name": "model.layers.44.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0698666983444127e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007934842724353075, "sensitivity": 0.5702038100252409 }, { "name": "model.layers.44.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007586389547213912, "sensitivity": 0.5191057090665521 }, { "name": "model.layers.44.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.136217613558983e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006996816955506802, "sensitivity": 0.5844370328889706 }, { "name": "model.layers.44.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.812562060076743e-05, "sensitivity": 0.8555029725419618 }, { "name": "model.layers.44.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1075313750552596e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007150328601710498, "sensitivity": 0.5271277172261417 }, { "name": "model.layers.44.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007386220386251807, "sensitivity": 0.518742872844671 }, { "name": "model.layers.44.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.743199941818602e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006678660283796489, "sensitivity": 0.5461431301202322 }, { "name": "model.layers.44.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.294927152339369e-05, "sensitivity": 0.818410091139163 }, { "name": "model.layers.44.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.467365321645048e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006704164552502334, "sensitivity": 0.5619190397834481 }, { "name": "model.layers.44.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007445893133990467, "sensitivity": 0.5834456394067822 }, { "name": "model.layers.44.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.524103481642669e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.989665805827826e-05, "sensitivity": 0.9110527778662919 }, { "name": "model.layers.44.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.756022048648447e-05, "sensitivity": 0.7561394837321828 }, { "name": "model.layers.44.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 7.643997719242179e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007632838096469641, "sensitivity": 0.52548852253232 }, { "name": "model.layers.44.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.094675675034523e-05, "sensitivity": 0.8177387659972656 }, { "name": "model.layers.44.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0698515779949958e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.745149585185573e-05, "sensitivity": 0.7171505418639965 }, { "name": "model.layers.44.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.273128721863031e-05, "sensitivity": 1.0896686426673539 }, { "name": "model.layers.44.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.637275772736757e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.2088055882486515e-05, "sensitivity": 1.2219474915583042 }, { "name": "model.layers.44.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.350595504045486e-05, "sensitivity": 0.6535044166260798 }, { "name": "model.layers.44.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2775096820405452e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.259721703827381e-05, "sensitivity": 0.7063881307457813 }, { "name": "model.layers.44.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0006969644455239177, "sensitivity": 0.520083351943519 }, { "name": "model.layers.44.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.637068162897776e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0006544226198457181, "sensitivity": 0.5253550249067844 }, { "name": "model.layers.44.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007302109152078629, "sensitivity": 0.5881302104037117 }, { "name": "model.layers.44.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.314170483776252e-07, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.715731458622031e-05, "sensitivity": 0.641668817816082 }, { "name": "model.layers.44.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.1670270396280102e-05, "sensitivity": 1.3064555404147842 }, { "name": "model.layers.44.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2756634077959461e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.984999006614089e-05, "sensitivity": 0.6487234972604823 }, { "name": "model.layers.44.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.239545084303245e-05, "sensitivity": 0.8995384246782281 }, { "name": "model.layers.44.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3915672525399714e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007861024932935834, "sensitivity": 0.5852179650140402 }, { "name": "model.layers.44.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.3930941804574104e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.4206801779437228e-06, "sensitivity": 2.109324169447973 }, { "name": "model.layers.44.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.071534931426868e-06, "sensitivity": 10.0 }, { "name": "model.layers.44.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 1.8237462882098043e-06, "sensitivity": 2.109686841069944 }, { "name": "model.layers.44.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 8.779413292359095e-06, "sensitivity": 2.199125208609128 }, { "name": "model.layers.44.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00021412920614238828, "sensitivity": 0.8263706462301548 }, { "name": "model.layers.44.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 2.0100136680412106e-05, "sensitivity": 1.0268966674290965 }, { "name": "model.layers.44.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 4.4510372390504926e-05, "sensitivity": 0.7496715369361794 }, { "name": "model.layers.44.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 3, "mse": 0.00029851519502699375, "sensitivity": 1.055959375796814 }, { "name": "model.layers.45.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008600009023211896, "sensitivity": 0.5435860710160527 }, { "name": "model.layers.45.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.046729587680602e-07, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000743160373531282, "sensitivity": 0.5506728871783448 }, { "name": "model.layers.45.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.024513615760952e-05, "sensitivity": 1.1540542245304195 }, { "name": "model.layers.45.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3937427638666122e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.747378938598558e-05, "sensitivity": 1.0022106468755 }, { "name": "model.layers.45.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.948078564368188e-05, "sensitivity": 0.65736489895252 }, { "name": "model.layers.45.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0747853593784384e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.615039794472978e-05, "sensitivity": 1.1840304800767387 }, { "name": "model.layers.45.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.882092904765159e-05, "sensitivity": 0.607888938247712 }, { "name": "model.layers.45.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4761275224373094e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.807036697864532e-05, "sensitivity": 0.6419111823366458 }, { "name": "model.layers.45.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.179785461630672e-05, "sensitivity": 0.8791290221728143 }, { "name": "model.layers.45.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.53728999775194e-07, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.576157466042787e-05, "sensitivity": 1.0350647001931104 }, { "name": "model.layers.45.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008505347068421543, "sensitivity": 0.5203128684251301 }, { "name": "model.layers.45.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1934038184335805e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007341510499827564, "sensitivity": 0.5917580637720207 }, { "name": "model.layers.45.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008646544883958995, "sensitivity": 0.549273239592306 }, { "name": "model.layers.45.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.0447553197300294e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.628358096349984e-05, "sensitivity": 0.7193673270288038 }, { "name": "model.layers.45.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.52217456465587e-05, "sensitivity": 0.832713581063116 }, { "name": "model.layers.45.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.7663485323282657e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.315495506394655e-05, "sensitivity": 0.834350547174187 }, { "name": "model.layers.45.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008097131503745914, "sensitivity": 0.5447011490242103 }, { "name": "model.layers.45.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0236424259346677e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007172293844632804, "sensitivity": 0.5842466440308783 }, { "name": "model.layers.45.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008094538934528828, "sensitivity": 0.5482884710447236 }, { "name": "model.layers.45.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0045630460808752e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 5.606769991572946e-05, "sensitivity": 0.6200274908383099 }, { "name": "model.layers.45.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 8.146620530169457e-05, "sensitivity": 0.7268170078544545 }, { "name": "model.layers.45.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4117216551312595e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.241707109846175e-05, "sensitivity": 0.7522055690562526 }, { "name": "model.layers.45.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.4123094842943829e-05, "sensitivity": 1.4735931765425454 }, { "name": "model.layers.45.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4088473108131438e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.931531243026257e-05, "sensitivity": 1.0630676238422683 }, { "name": "model.layers.45.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 8.087315654847771e-05, "sensitivity": 1.1638864973176737 }, { "name": "model.layers.45.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2484970284276642e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.995428702794015e-05, "sensitivity": 0.6666885803855858 }, { "name": "model.layers.45.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0009171671117655933, "sensitivity": 0.5847369702657312 }, { "name": "model.layers.45.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.815205430641072e-07, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.384286436717957e-05, "sensitivity": 0.7972932179652155 }, { "name": "model.layers.45.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0009095397545024753, "sensitivity": 0.5740220731407834 }, { "name": "model.layers.45.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1650809028651565e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.679140253458172e-05, "sensitivity": 0.7787535867250746 }, { "name": "model.layers.45.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 8.002850518096238e-05, "sensitivity": 0.6098539326450604 }, { "name": "model.layers.45.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.750546041686903e-07, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008328684489242733, "sensitivity": 0.5995219646601182 }, { "name": "model.layers.45.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0009044675971381366, "sensitivity": 0.5354644805419131 }, { "name": "model.layers.45.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0524157687541447e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008785586105659604, "sensitivity": 0.5995457089863592 }, { "name": "model.layers.45.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.95809319242835e-05, "sensitivity": 0.602592473754132 }, { "name": "model.layers.45.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1103860515504493e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.494816236430779e-05, "sensitivity": 0.6465268142636209 }, { "name": "model.layers.45.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008715951698832214, "sensitivity": 0.5560060637628348 }, { "name": "model.layers.45.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.7979626818487304e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007868236862123013, "sensitivity": 0.5655758646821407 }, { "name": "model.layers.45.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.304440077859908e-05, "sensitivity": 0.9320252594344762 }, { "name": "model.layers.45.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0239521088806214e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.879839929752052e-05, "sensitivity": 0.9652409338553909 }, { "name": "model.layers.45.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000919818296097219, "sensitivity": 0.5554920072441601 }, { "name": "model.layers.45.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2060945664416067e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008803682285360992, "sensitivity": 0.5513065051055324 }, { "name": "model.layers.45.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.581223326269537e-05, "sensitivity": 0.6335120448350059 }, { "name": "model.layers.45.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2763775885105133e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.028868276393041e-05, "sensitivity": 0.7125139518317568 }, { "name": "model.layers.45.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.597616058774292e-05, "sensitivity": 0.6395563474129953 }, { "name": "model.layers.45.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4403524346562335e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.756697985110804e-05, "sensitivity": 0.8842266949559046 }, { "name": "model.layers.45.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008727246895432472, "sensitivity": 0.5620232534408834 }, { "name": "model.layers.45.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0517534292375785e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.450472574215382e-05, "sensitivity": 0.7217371036056702 }, { "name": "model.layers.45.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008798248018138111, "sensitivity": 0.5486489822778139 }, { "name": "model.layers.45.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1122886007797206e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.612383731408045e-05, "sensitivity": 0.6152507051274791 }, { "name": "model.layers.45.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008623792673461139, "sensitivity": 0.5581546407592876 }, { "name": "model.layers.45.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.575137482897844e-07, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.101475785020739e-05, "sensitivity": 0.6139406791663458 }, { "name": "model.layers.45.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000856596976518631, "sensitivity": 0.5436020591007983 }, { "name": "model.layers.45.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0080069614559761e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.015408482402563e-05, "sensitivity": 0.7915416014956301 }, { "name": "model.layers.45.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.53757412894629e-05, "sensitivity": 0.744623582736799 }, { "name": "model.layers.45.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2846370509578264e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.957879668334499e-05, "sensitivity": 0.6233761042501029 }, { "name": "model.layers.45.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007994830375537276, "sensitivity": 0.5615007742590838 }, { "name": "model.layers.45.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1242632353969384e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.1666200407489669e-05, "sensitivity": 1.314444718647411 }, { "name": "model.layers.45.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008593471138738096, "sensitivity": 0.5524806825242047 }, { "name": "model.layers.45.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.392069273417292e-07, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008339385385625064, "sensitivity": 0.595661811184303 }, { "name": "model.layers.45.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000833032769151032, "sensitivity": 0.537004883534392 }, { "name": "model.layers.45.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0002278258980368e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007419927860610187, "sensitivity": 0.568868829604811 }, { "name": "model.layers.45.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.707197073614225e-05, "sensitivity": 0.7863390107230465 }, { "name": "model.layers.45.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.7770371414371766e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008123075822368264, "sensitivity": 0.5734454764030495 }, { "name": "model.layers.45.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008495566435158253, "sensitivity": 0.5838700618537951 }, { "name": "model.layers.45.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0017761269409675e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.460231088567525e-05, "sensitivity": 0.6396176944263368 }, { "name": "model.layers.45.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.3489179764292203e-05, "sensitivity": 1.3491291572207988 }, { "name": "model.layers.45.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3763418564849417e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.4518842363031581e-05, "sensitivity": 1.638372254932843 }, { "name": "model.layers.45.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007727860938757658, "sensitivity": 0.5824213722269633 }, { "name": "model.layers.45.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2392486041790107e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.0481845139293e-05, "sensitivity": 0.6221593449538874 }, { "name": "model.layers.45.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 8.640624582767487e-05, "sensitivity": 0.7051051115473276 }, { "name": "model.layers.45.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.339798927801894e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.220498420996591e-05, "sensitivity": 0.6361243893088147 }, { "name": "model.layers.45.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.59319809731096e-05, "sensitivity": 0.7761376782442868 }, { "name": "model.layers.45.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0184974144067382e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007923810044303536, "sensitivity": 0.5566104328088077 }, { "name": "model.layers.45.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.591672328999266e-05, "sensitivity": 0.7289159421644413 }, { "name": "model.layers.45.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.117852207244141e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007684823940508068, "sensitivity": 0.5969862758303993 }, { "name": "model.layers.45.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 8.016926585696638e-05, "sensitivity": 0.8013085699725335 }, { "name": "model.layers.45.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.9497763332765317e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.70556871430017e-05, "sensitivity": 0.6255811217894212 }, { "name": "model.layers.45.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 8.820625953376293e-05, "sensitivity": 0.7689361292278383 }, { "name": "model.layers.45.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.50554785705026e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.391047595068812e-05, "sensitivity": 0.6352617466701862 }, { "name": "model.layers.45.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 8.332041761605069e-05, "sensitivity": 0.7134652049651453 }, { "name": "model.layers.45.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1282195373496506e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.000814079015981406, "sensitivity": 0.5531449510710328 }, { "name": "model.layers.45.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008538783877156675, "sensitivity": 0.5921694801484423 }, { "name": "model.layers.45.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0664305136742769e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.612384459003806e-05, "sensitivity": 0.6099073000491493 }, { "name": "model.layers.45.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.967992132762447e-05, "sensitivity": 0.8802183240568815 }, { "name": "model.layers.45.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.016517671814654e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.663148426217958e-05, "sensitivity": 0.6767365173728368 }, { "name": "model.layers.45.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.57361961202696e-05, "sensitivity": 0.9463141048833418 }, { "name": "model.layers.45.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2430740525815054e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.115067662904039e-05, "sensitivity": 0.7647484654674149 }, { "name": "model.layers.45.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.263537554536015e-05, "sensitivity": 0.8983198284253251 }, { "name": "model.layers.45.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.948944352800027e-07, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.204983558040112e-05, "sensitivity": 0.8056458139962067 }, { "name": "model.layers.45.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.217511301860213e-05, "sensitivity": 0.7975619966445967 }, { "name": "model.layers.45.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8407303059575497e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.942470645299181e-05, "sensitivity": 0.7011462274397455 }, { "name": "model.layers.45.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.486416143365204e-05, "sensitivity": 0.6548094081062197 }, { "name": "model.layers.45.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6775178437455907e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.085640052333474e-05, "sensitivity": 0.7428441666307954 }, { "name": "model.layers.45.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008079198887571692, "sensitivity": 0.5745595502906116 }, { "name": "model.layers.45.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.104953526009922e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.058688086341135e-05, "sensitivity": 1.051264510919514 }, { "name": "model.layers.45.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.257718243636191e-05, "sensitivity": 0.9347630696326128 }, { "name": "model.layers.45.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.063857212102448e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007589695742353797, "sensitivity": 0.5928776712023085 }, { "name": "model.layers.45.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.142200774978846e-05, "sensitivity": 0.6337081658470192 }, { "name": "model.layers.45.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.721343303681351e-07, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.72074020258151e-05, "sensitivity": 0.6764692018687412 }, { "name": "model.layers.45.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0007837309967726469, "sensitivity": 0.5977007336789903 }, { "name": "model.layers.45.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 3.965688847529236e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007097739726305008, "sensitivity": 0.5896044651783394 }, { "name": "model.layers.45.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.667703903280199e-05, "sensitivity": 0.6794212594258718 }, { "name": "model.layers.45.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3990733123137034e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.335349800996482e-05, "sensitivity": 0.691034160731711 }, { "name": "model.layers.45.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 6.920025043655187e-05, "sensitivity": 0.8619781022863682 }, { "name": "model.layers.45.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4377413890542812e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.612152355955914e-05, "sensitivity": 0.6367353813153447 }, { "name": "model.layers.45.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.944137178128585e-05, "sensitivity": 1.0409026711545604 }, { "name": "model.layers.45.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 8.935154482969665e-07, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008151166839525104, "sensitivity": 0.5790338712880684 }, { "name": "model.layers.45.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.569514855276793e-05, "sensitivity": 0.9380654540488218 }, { "name": "model.layers.45.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6169117316167103e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.306864426936954e-05, "sensitivity": 0.9124794054286507 }, { "name": "model.layers.45.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000898249913007021, "sensitivity": 0.5997248210926773 }, { "name": "model.layers.45.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.392456852045143e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.960241444176063e-05, "sensitivity": 0.939249540965095 }, { "name": "model.layers.45.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008494501817040145, "sensitivity": 0.5814815137109908 }, { "name": "model.layers.45.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.221024583894177e-07, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.03753248672001e-05, "sensitivity": 0.6350799936498673 }, { "name": "model.layers.45.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.000905133318156004, "sensitivity": 0.5948087874525744 }, { "name": "model.layers.45.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.2555495888809673e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.207999442471191e-05, "sensitivity": 0.6498325910795187 }, { "name": "model.layers.45.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.3318956007424276e-05, "sensitivity": 1.4048044276371554 }, { "name": "model.layers.45.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1067650120821781e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.2705127119261306e-05, "sensitivity": 1.2243219626895918 }, { "name": "model.layers.45.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.650037878192961e-05, "sensitivity": 0.607927158014021 }, { "name": "model.layers.45.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0490066415513866e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0007089567370712757, "sensitivity": 0.5794112279122521 }, { "name": "model.layers.45.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 8.471207547700033e-05, "sensitivity": 0.9166432664662603 }, { "name": "model.layers.45.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2001246432191692e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.199881267501041e-05, "sensitivity": 0.6246974648169094 }, { "name": "model.layers.45.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.494653982575983e-05, "sensitivity": 0.8525392025019264 }, { "name": "model.layers.45.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 9.7172642199439e-07, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.909861258463934e-05, "sensitivity": 0.6142372547637023 }, { "name": "model.layers.45.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 7.95376327005215e-05, "sensitivity": 0.6603417796074791 }, { "name": "model.layers.45.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.518030669307336e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.560780457220972e-05, "sensitivity": 0.6296475229566127 }, { "name": "model.layers.45.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0008393779280595481, "sensitivity": 0.5716619571933604 }, { "name": "model.layers.45.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0123412721441127e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 6.464013131335378e-05, "sensitivity": 0.6108437835235075 }, { "name": "model.layers.45.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 1.8190205537393922e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 1.6067961041699164e-06, "sensitivity": 2.1083288145833645 }, { "name": "model.layers.45.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.926980636810185e-06, "sensitivity": 10.0 }, { "name": "model.layers.45.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 2.0644049527618336e-06, "sensitivity": 2.109535532406374 }, { "name": "model.layers.45.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 1.013837299979059e-05, "sensitivity": 2.2204466115840265 }, { "name": "model.layers.45.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00017677027790341526, "sensitivity": 0.8236962237716552 }, { "name": "model.layers.45.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 2.1967405700706877e-05, "sensitivity": 0.8446330295454528 }, { "name": "model.layers.45.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 4.876946331933141e-05, "sensitivity": 0.8716644334658985 }, { "name": "model.layers.45.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 4, "mse": 4.9542071792529896e-05, "sensitivity": 1.5901123538979212 }, { "name": "model.layers.46.mlp.experts.0.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00013053754810243845, "sensitivity": 1.1540859258735257 }, { "name": "model.layers.46.mlp.experts.0.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.122098521795124e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.0.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.381332736462355e-05, "sensitivity": 0.6905156466636507 }, { "name": "model.layers.46.mlp.experts.1.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010879666660912335, "sensitivity": 0.8795830257682993 }, { "name": "model.layers.46.mlp.experts.1.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.0300094547565095e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.1.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0009560708422213793, "sensitivity": 0.5719404433138788 }, { "name": "model.layers.46.mlp.experts.10.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 8.474296191707253e-05, "sensitivity": 0.6319915408349575 }, { "name": "model.layers.46.mlp.experts.10.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8695718608796597e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.10.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.249541133409366e-05, "sensitivity": 0.655211592740122 }, { "name": "model.layers.46.mlp.experts.11.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 9.738648077473044e-05, "sensitivity": 1.0485965012833631 }, { "name": "model.layers.46.mlp.experts.11.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4594719459637417e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.11.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.301745740231127e-05, "sensitivity": 0.6655316393403599 }, { "name": "model.layers.46.mlp.experts.12.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00011350627028150484, "sensitivity": 0.7450068331748543 }, { "name": "model.layers.46.mlp.experts.12.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.154917183361249e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.12.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.293020073324442e-05, "sensitivity": 0.7598743987749716 }, { "name": "model.layers.46.mlp.experts.13.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010155553900403902, "sensitivity": 0.6072357724480051 }, { "name": "model.layers.46.mlp.experts.13.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1052422905777348e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.13.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008489048923365772, "sensitivity": 0.5843294537520678 }, { "name": "model.layers.46.mlp.experts.14.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 4.3360714698792435e-06, "sensitivity": 2.0987240938288028 }, { "name": "model.layers.46.mlp.experts.14.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8251203073305078e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.14.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.868294389685616e-05, "sensitivity": 0.656203764879123 }, { "name": "model.layers.46.mlp.experts.15.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010342919267714024, "sensitivity": 0.8328166200227044 }, { "name": "model.layers.46.mlp.experts.15.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.7903067752486095e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.15.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.958554826676846e-05, "sensitivity": 0.955444338274527 }, { "name": "model.layers.46.mlp.experts.16.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 4.485902991291368e-06, "sensitivity": 2.098514128802802 }, { "name": "model.layers.46.mlp.experts.16.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.229585791406862e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.16.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0009584426297806203, "sensitivity": 0.5679928447078884 }, { "name": "model.layers.46.mlp.experts.17.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.8910803191829473e-05, "sensitivity": 1.6894713475979257 }, { "name": "model.layers.46.mlp.experts.17.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.991329781958484e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.17.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.333396883448586e-05, "sensitivity": 0.6873266003535886 }, { "name": "model.layers.46.mlp.experts.18.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.877342765510548e-05, "sensitivity": 1.4557419679800532 }, { "name": "model.layers.46.mlp.experts.18.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8117798390449025e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.18.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.988658373709768e-05, "sensitivity": 0.6511999195623991 }, { "name": "model.layers.46.mlp.experts.19.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.943886309163645e-05, "sensitivity": 1.766829465468553 }, { "name": "model.layers.46.mlp.experts.19.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.7923524637808441e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.19.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.251554001821205e-05, "sensitivity": 0.8043060136197127 }, { "name": "model.layers.46.mlp.experts.2.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 2.1326462956494652e-05, "sensitivity": 1.9145930021211206 }, { "name": "model.layers.46.mlp.experts.2.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.273237896588398e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.2.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 3.756400019483408e-06, "sensitivity": 2.1006977676448204 }, { "name": "model.layers.46.mlp.experts.20.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 4.208316113363253e-06, "sensitivity": 2.0985394743905172 }, { "name": "model.layers.46.mlp.experts.20.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8273898376719444e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.20.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.482372843194753e-05, "sensitivity": 0.601701657246742 }, { "name": "model.layers.46.mlp.experts.21.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 4.438781616045162e-06, "sensitivity": 2.099681206521256 }, { "name": "model.layers.46.mlp.experts.21.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.983027222100645e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.21.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.428702130913734e-05, "sensitivity": 0.9091180432871573 }, { "name": "model.layers.46.mlp.experts.22.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.0001066589611582458, "sensitivity": 0.7411979167223126 }, { "name": "model.layers.46.mlp.experts.22.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3109236078889808e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.22.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.679738337174058e-05, "sensitivity": 0.609772366496049 }, { "name": "model.layers.46.mlp.experts.23.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00012317218352109194, "sensitivity": 0.6840122977627195 }, { "name": "model.layers.46.mlp.experts.23.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1975281495324452e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.23.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.533964864909649e-05, "sensitivity": 0.6582890164146779 }, { "name": "model.layers.46.mlp.experts.24.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010157186625292525, "sensitivity": 0.6479654854701529 }, { "name": "model.layers.46.mlp.experts.24.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5207700698738336e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.24.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.100641571218148e-05, "sensitivity": 0.6125182949513044 }, { "name": "model.layers.46.mlp.experts.25.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010310176730854437, "sensitivity": 1.1445992463107237 }, { "name": "model.layers.46.mlp.experts.25.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.8988433794220327e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.25.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.00572379375808e-05, "sensitivity": 0.8686785132743036 }, { "name": "model.layers.46.mlp.experts.26.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00011125087621621788, "sensitivity": 0.6579409378281863 }, { "name": "model.layers.46.mlp.experts.26.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3023477549722884e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.26.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.517985017737374e-05, "sensitivity": 0.6187835364232087 }, { "name": "model.layers.46.mlp.experts.27.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 4.343546606833115e-06, "sensitivity": 2.099172251731805 }, { "name": "model.layers.46.mlp.experts.27.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.7955205748876324e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.27.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 2.0589632185874507e-05, "sensitivity": 1.282000454345655 }, { "name": "model.layers.46.mlp.experts.28.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010480178752914071, "sensitivity": 0.9511266975472541 }, { "name": "model.layers.46.mlp.experts.28.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2454079296730924e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.28.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.78891660249792e-05, "sensitivity": 0.6212760424958272 }, { "name": "model.layers.46.mlp.experts.29.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00011129312770208344, "sensitivity": 1.045023796846907 }, { "name": "model.layers.46.mlp.experts.29.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.927395715028979e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.29.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.514456905890256e-05, "sensitivity": 0.6545094700259033 }, { "name": "model.layers.46.mlp.experts.3.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010692574142012745, "sensitivity": 0.6556030107722463 }, { "name": "model.layers.46.mlp.experts.3.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.135741740654339e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.3.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008977591060101986, "sensitivity": 0.5794994307769875 }, { "name": "model.layers.46.mlp.experts.30.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 9.474702528677881e-05, "sensitivity": 1.0185753255162837 }, { "name": "model.layers.46.mlp.experts.30.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1864935913763475e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.30.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0009499727748334408, "sensitivity": 0.5684232739227039 }, { "name": "model.layers.46.mlp.experts.31.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 2.05737778742332e-05, "sensitivity": 1.2525790323625374 }, { "name": "model.layers.46.mlp.experts.31.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6598085039731814e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.31.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.280466474592686e-05, "sensitivity": 0.6635620850512902 }, { "name": "model.layers.46.mlp.experts.32.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 9.404008596902713e-05, "sensitivity": 1.0511673175938694 }, { "name": "model.layers.46.mlp.experts.32.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2180041721876478e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.32.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.113249689107761e-05, "sensitivity": 0.74070964156838 }, { "name": "model.layers.46.mlp.experts.33.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010200943506788462, "sensitivity": 0.9590632783069597 }, { "name": "model.layers.46.mlp.experts.33.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.199842927235295e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.33.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.727259410079569e-05, "sensitivity": 1.0429055356891057 }, { "name": "model.layers.46.mlp.experts.34.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 9.717916691442952e-05, "sensitivity": 0.6967245799783546 }, { "name": "model.layers.46.mlp.experts.34.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1343927326379344e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.34.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.960900984471664e-05, "sensitivity": 0.6088278551174666 }, { "name": "model.layers.46.mlp.experts.35.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010666543676052243, "sensitivity": 0.604445307411541 }, { "name": "model.layers.46.mlp.experts.35.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.996402716031298e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.35.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 3.6781354992854176e-06, "sensitivity": 2.0995149739351646 }, { "name": "model.layers.46.mlp.experts.36.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 5.305688318912871e-06, "sensitivity": 2.0998511110087104 }, { "name": "model.layers.46.mlp.experts.36.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.7987838418775937e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.36.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 0.00010054021549876779, "sensitivity": 1.1664491375364472 }, { "name": "model.layers.46.mlp.experts.37.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.001133376150391996, "sensitivity": 0.5807802798203303 }, { "name": "model.layers.46.mlp.experts.37.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.1788926005683606e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.37.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.867350697983056e-05, "sensitivity": 0.7596439744312654 }, { "name": "model.layers.46.mlp.experts.38.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010864916112041101, "sensitivity": 0.710252310294041 }, { "name": "model.layers.46.mlp.experts.38.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2010686987196095e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.38.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0008776218164712191, "sensitivity": 0.5922126000716875 }, { "name": "model.layers.46.mlp.experts.39.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.804723979148548e-05, "sensitivity": 1.3070558627436712 }, { "name": "model.layers.46.mlp.experts.39.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0657229267962975e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.39.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.90316189522855e-05, "sensitivity": 0.6329484402872412 }, { "name": "model.layers.46.mlp.experts.4.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.5606907254550606e-05, "sensitivity": 1.5075152295087124 }, { "name": "model.layers.46.mlp.experts.4.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 5.269886514724931e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.4.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.448414544342086e-05, "sensitivity": 0.9407550949597456 }, { "name": "model.layers.46.mlp.experts.40.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00011773363803513348, "sensitivity": 0.8233412587228348 }, { "name": "model.layers.46.mlp.experts.40.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6288553297272301e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.40.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0010520981159061193, "sensitivity": 0.58472057541629 }, { "name": "model.layers.46.mlp.experts.41.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.873902147053741e-05, "sensitivity": 1.320980657590054 }, { "name": "model.layers.46.mlp.experts.41.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2960615549673093e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.41.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.676039240323007e-05, "sensitivity": 0.6065435258129059 }, { "name": "model.layers.46.mlp.experts.42.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.751094350765925e-05, "sensitivity": 1.4766472995816475 }, { "name": "model.layers.46.mlp.experts.42.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.861512257368304e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.42.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 4.274795628589345e-06, "sensitivity": 2.0990434326036955 }, { "name": "model.layers.46.mlp.experts.43.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.0012073916150256991, "sensitivity": 0.5614323236678874 }, { "name": "model.layers.46.mlp.experts.43.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.421253500666353e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.43.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0009274596231989563, "sensitivity": 0.5873822556360889 }, { "name": "model.layers.46.mlp.experts.44.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010641371773090214, "sensitivity": 0.8012652369644389 }, { "name": "model.layers.46.mlp.experts.44.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.7673650063443347e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.44.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.86652123881504e-05, "sensitivity": 0.704389329413023 }, { "name": "model.layers.46.mlp.experts.45.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.7736878362484276e-05, "sensitivity": 1.543063093501421 }, { "name": "model.layers.46.mlp.experts.45.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.92630352305423e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.45.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.5093273759703152e-05, "sensitivity": 1.2489380806178527 }, { "name": "model.layers.46.mlp.experts.46.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 9.366613812744617e-05, "sensitivity": 0.8768244266247034 }, { "name": "model.layers.46.mlp.experts.46.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.0231756277789827e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.46.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0009026401676237583, "sensitivity": 0.5817323587133575 }, { "name": "model.layers.46.mlp.experts.47.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00011012342292815447, "sensitivity": 0.8910287122249305 }, { "name": "model.layers.46.mlp.experts.47.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.502993427493493e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.47.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.726939267944545e-05, "sensitivity": 0.7940473502668739 }, { "name": "model.layers.46.mlp.experts.48.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010842355550266802, "sensitivity": 0.8101608150012826 }, { "name": "model.layers.46.mlp.experts.48.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2980326573597267e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.48.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.429693454876542e-05, "sensitivity": 0.6318005057176563 }, { "name": "model.layers.46.mlp.experts.49.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 9.742174734128639e-05, "sensitivity": 0.9750642516618144 }, { "name": "model.layers.46.mlp.experts.49.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.5119048839551397e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.49.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.3263651453598868e-05, "sensitivity": 1.644600777455261 }, { "name": "model.layers.46.mlp.experts.5.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010652725177351385, "sensitivity": 0.7083801756341188 }, { "name": "model.layers.46.mlp.experts.5.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.071958533633733e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.5.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.945196168497205e-05, "sensitivity": 0.7658374839889344 }, { "name": "model.layers.46.mlp.experts.50.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 4.420996901899343e-06, "sensitivity": 2.100853909159902 }, { "name": "model.layers.46.mlp.experts.50.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.3869458800618304e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.50.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 0.0001221860875375569, "sensitivity": 0.9823834021216635 }, { "name": "model.layers.46.mlp.experts.51.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 4.28300063504139e-06, "sensitivity": 2.1006699222196135 }, { "name": "model.layers.46.mlp.experts.51.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 3.3507774332974805e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.51.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 6.529965958179673e-06, "sensitivity": 2.1025294138970536 }, { "name": "model.layers.46.mlp.experts.52.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010687959002098069, "sensitivity": 0.7623752716758115 }, { "name": "model.layers.46.mlp.experts.52.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.15448130297591e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.52.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.899572665337473e-05, "sensitivity": 0.8429427699608418 }, { "name": "model.layers.46.mlp.experts.53.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.001111392630264163, "sensitivity": 0.5829775525710755 }, { "name": "model.layers.46.mlp.experts.53.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.210277105201385e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.53.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.4761735656065866e-05, "sensitivity": 1.2011206045893417 }, { "name": "model.layers.46.mlp.experts.54.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 2, "mse": 0.001143809175118804, "sensitivity": 0.5909614605255281 }, { "name": "model.layers.46.mlp.experts.54.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1435654414526653e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.54.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0009809763869270682, "sensitivity": 0.549502466218953 }, { "name": "model.layers.46.mlp.experts.55.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 3.4544598292995943e-06, "sensitivity": 2.0986120611428976 }, { "name": "model.layers.46.mlp.experts.55.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.38709958466643e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.55.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.689740545582026e-05, "sensitivity": 0.8556894910267245 }, { "name": "model.layers.46.mlp.experts.56.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.0001061617731465958, "sensitivity": 0.633733003179401 }, { "name": "model.layers.46.mlp.experts.56.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.2861146387876943e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.56.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.191523036453873e-05, "sensitivity": 0.654646176216343 }, { "name": "model.layers.46.mlp.experts.57.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.898840673675295e-05, "sensitivity": 1.5125387803609518 }, { "name": "model.layers.46.mlp.experts.57.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3516355465981178e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.57.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0010475933086127043, "sensitivity": 0.5690659365014517 }, { "name": "model.layers.46.mlp.experts.58.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 1.819782301026862e-05, "sensitivity": 1.8490677158062097 }, { "name": "model.layers.46.mlp.experts.58.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.6007686554075917e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.58.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 8.326483657583594e-05, "sensitivity": 0.9632554009089189 }, { "name": "model.layers.46.mlp.experts.59.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 4, "mse": 2.346161454624962e-05, "sensitivity": 1.252072382418025 }, { "name": "model.layers.46.mlp.experts.59.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.531058615000802e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.59.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.694177626632154e-05, "sensitivity": 1.6539339185632622 }, { "name": "model.layers.46.mlp.experts.6.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 4.1555440475349315e-06, "sensitivity": 2.1001783274159425 }, { "name": "model.layers.46.mlp.experts.6.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 2.0449624571483582e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.6.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.90522894426249e-05, "sensitivity": 0.7466088728314594 }, { "name": "model.layers.46.mlp.experts.60.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 9.822245920076966e-05, "sensitivity": 0.7367763340266343 }, { "name": "model.layers.46.mlp.experts.60.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.916970177262556e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.60.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 7.404392817988992e-05, "sensitivity": 0.7022742210057766 }, { "name": "model.layers.46.mlp.experts.61.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010403658961877227, "sensitivity": 0.602251724658996 }, { "name": "model.layers.46.mlp.experts.61.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1604245173657546e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.61.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0009186958777718246, "sensitivity": 0.5806266291238447 }, { "name": "model.layers.46.mlp.experts.62.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.0001035523455357179, "sensitivity": 1.0184639926687642 }, { "name": "model.layers.46.mlp.experts.62.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.4906822798366193e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.62.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 9.227472764905542e-05, "sensitivity": 0.6510924613941828 }, { "name": "model.layers.46.mlp.experts.63.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00011185988842044026, "sensitivity": 0.8154791655724977 }, { "name": "model.layers.46.mlp.experts.63.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.828636754908075e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.63.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 3, "mse": 0.00010190786269959062, "sensitivity": 0.6719851156516655 }, { "name": "model.layers.46.mlp.experts.7.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.0001069737336365506, "sensitivity": 1.035304236231595 }, { "name": "model.layers.46.mlp.experts.7.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3336547226572293e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.7.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0009811162017285824, "sensitivity": 0.5917661447253096 }, { "name": "model.layers.46.mlp.experts.8.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.000111205896246247, "sensitivity": 0.645539685538388 }, { "name": "model.layers.46.mlp.experts.8.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.1488540394566371e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.8.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 4, "mse": 1.5673584130126983e-05, "sensitivity": 1.4376614323485015 }, { "name": "model.layers.46.mlp.experts.9.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 3, "mse": 0.00010624093556543812, "sensitivity": 1.1594959807731062 }, { "name": "model.layers.46.mlp.experts.9.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 1.3168137229513377e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.experts.9.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 2, "mse": 0.0009507543290965259, "sensitivity": 0.5835253820331218 }, { "name": "model.layers.46.mlp.gate.weight", "shape": [ 64, 2048 ], "bits": 6, "mse": 3.142298965030932e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.shared_experts.down_proj.weight", "shape": [ 2048, 1536 ], "bits": 5, "mse": 2.402887275820831e-06, "sensitivity": 2.1124414328273495 }, { "name": "model.layers.46.mlp.shared_experts.gate_proj.weight", "shape": [ 1536, 2048 ], "bits": 6, "mse": 4.825660653295927e-06, "sensitivity": 10.0 }, { "name": "model.layers.46.mlp.shared_experts.up_proj.weight", "shape": [ 1536, 2048 ], "bits": 5, "mse": 3.40148631039483e-06, "sensitivity": 2.1102974568803563 }, { "name": "model.layers.46.self_attn.kv_a_proj_with_mqa.weight", "shape": [ 576, 2048 ], "bits": 5, "mse": 8.597387932240963e-06, "sensitivity": 2.225498087223552 }, { "name": "model.layers.46.self_attn.kv_b_proj.weight", "shape": [ 8960, 512 ], "bits": 3, "mse": 0.00020850496366620064, "sensitivity": 1.0691658795041334 }, { "name": "model.layers.46.self_attn.o_proj.weight", "shape": [ 2048, 5120 ], "bits": 4, "mse": 1.890434396045748e-05, "sensitivity": 1.5446165103703402 }, { "name": "model.layers.46.self_attn.q_a_proj.weight", "shape": [ 768, 2048 ], "bits": 3, "mse": 3.232548988307826e-05, "sensitivity": 0.7564150290413465 }, { "name": "model.layers.46.self_attn.q_b_proj.weight", "shape": [ 5120, 768 ], "bits": 4, "mse": 7.500631909351796e-05, "sensitivity": 1.3365260246052333 } ] }