Text-to-Speech
Transformers
Safetensors
higgs_multimodal_qwen3
text-generation
speech-generation
higgs-audio
qwen3
quantization
4-bit precision
awq
Instructions to use Reza2kn/Higgs-Audio-v3-TTS-4bit-AWQ with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use Reza2kn/Higgs-Audio-v3-TTS-4bit-AWQ with Transformers:
# Use a pipeline as a high-level helper
from transformers import pipeline
pipe = pipeline("text-to-speech", model="Reza2kn/Higgs-Audio-v3-TTS-4bit-AWQ")
# Load model directly
from transformers import AutoModelForSeq2SeqLM
model = AutoModelForSeq2SeqLM.from_pretrained("Reza2kn/Higgs-Audio-v3-TTS-4bit-AWQ", dtype="auto")
- Notebooks
- Google Colab
- Kaggle
| { | |
| "count": 252, | |
| "max_rel_l2": 0.11238045245409012, | |
| "mean_rel_l2": 0.06897487713112718, | |
| "max_abs_error": 0.07962238788604736, | |
| "tensors": [ | |
| { | |
| "name": "body.layers.0.mlp.down_proj.weight", | |
| "rel_l2": 0.07596064358949661, | |
| "max_abs": 0.03170572221279144, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.0.mlp.gate_proj.weight", | |
| "rel_l2": 0.07382253557443619, | |
| "max_abs": 0.02472330629825592, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.0.mlp.up_proj.weight", | |
| "rel_l2": 0.07318302243947983, | |
| "max_abs": 0.01948242262005806, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.0.self_attn.k_proj.weight", | |
| "rel_l2": 0.06984613835811615, | |
| "max_abs": 0.01751302182674408, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.0.self_attn.o_proj.weight", | |
| "rel_l2": 0.08070118725299835, | |
| "max_abs": 0.03001301735639572, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.0.self_attn.q_proj.weight", | |
| "rel_l2": 0.07181426137685776, | |
| "max_abs": 0.03404948115348816, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.0.self_attn.v_proj.weight", | |
| "rel_l2": 0.07539399713277817, | |
| "max_abs": 0.00996093824505806, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.1.mlp.down_proj.weight", | |
| "rel_l2": 0.07532299309968948, | |
| "max_abs": 0.04707030951976776, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.1.mlp.gate_proj.weight", | |
| "rel_l2": 0.07333692163228989, | |
| "max_abs": 0.018847651779651642, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.1.mlp.up_proj.weight", | |
| "rel_l2": 0.07860323041677475, | |
| "max_abs": 0.01565755158662796, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.1.self_attn.k_proj.weight", | |
| "rel_l2": 0.07382981479167938, | |
| "max_abs": 0.01249186135828495, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.1.self_attn.o_proj.weight", | |
| "rel_l2": 0.07480081170797348, | |
| "max_abs": 0.0257161483168602, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.1.self_attn.q_proj.weight", | |
| "rel_l2": 0.07748466730117798, | |
| "max_abs": 0.02509765326976776, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.1.self_attn.v_proj.weight", | |
| "rel_l2": 0.07837365567684174, | |
| "max_abs": 0.009179685264825821, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.10.mlp.down_proj.weight", | |
| "rel_l2": 0.06622204184532166, | |
| "max_abs": 0.05677083134651184, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.10.mlp.gate_proj.weight", | |
| "rel_l2": 0.06722308695316315, | |
| "max_abs": 0.034912109375, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.10.mlp.up_proj.weight", | |
| "rel_l2": 0.06583248823881149, | |
| "max_abs": 0.0377604141831398, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.10.self_attn.k_proj.weight", | |
| "rel_l2": 0.06801741570234299, | |
| "max_abs": 0.02412109076976776, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.10.self_attn.o_proj.weight", | |
| "rel_l2": 0.06308775395154953, | |
| "max_abs": 0.032421886920928955, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.10.self_attn.q_proj.weight", | |
| "rel_l2": 0.06795214116573334, | |
| "max_abs": 0.01612142100930214, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.10.self_attn.v_proj.weight", | |
| "rel_l2": 0.06346894800662994, | |
| "max_abs": 0.01075846329331398, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.11.mlp.down_proj.weight", | |
| "rel_l2": 0.06584431231021881, | |
| "max_abs": 0.04075521230697632, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.11.mlp.gate_proj.weight", | |
| "rel_l2": 0.0669279471039772, | |
| "max_abs": 0.02861328050494194, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.11.mlp.up_proj.weight", | |
| "rel_l2": 0.06534443795681, | |
| "max_abs": 0.02846679836511612, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.11.self_attn.k_proj.weight", | |
| "rel_l2": 0.06801076978445053, | |
| "max_abs": 0.02184244990348816, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.11.self_attn.o_proj.weight", | |
| "rel_l2": 0.06148053705692291, | |
| "max_abs": 0.029882818460464478, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.11.self_attn.q_proj.weight", | |
| "rel_l2": 0.06818917393684387, | |
| "max_abs": 0.019921869039535522, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.11.self_attn.v_proj.weight", | |
| "rel_l2": 0.06125301122665405, | |
| "max_abs": 0.011067710816860199, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.12.mlp.down_proj.weight", | |
| "rel_l2": 0.06559903919696808, | |
| "max_abs": 0.05670572817325592, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.12.mlp.gate_proj.weight", | |
| "rel_l2": 0.06648173183202744, | |
| "max_abs": 0.043701171875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.12.mlp.up_proj.weight", | |
| "rel_l2": 0.06457459181547165, | |
| "max_abs": 0.02776692807674408, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.12.self_attn.k_proj.weight", | |
| "rel_l2": 0.06599076837301254, | |
| "max_abs": 0.02783203125, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.12.self_attn.o_proj.weight", | |
| "rel_l2": 0.06351252645254135, | |
| "max_abs": 0.04173177480697632, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.12.self_attn.q_proj.weight", | |
| "rel_l2": 0.0672365054488182, | |
| "max_abs": 0.02031250298023224, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.12.self_attn.v_proj.weight", | |
| "rel_l2": 0.06122998520731926, | |
| "max_abs": 0.01409505121409893, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.13.mlp.down_proj.weight", | |
| "rel_l2": 0.06621025502681732, | |
| "max_abs": 0.0419921875, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.13.mlp.gate_proj.weight", | |
| "rel_l2": 0.06676726788282394, | |
| "max_abs": 0.029296875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.13.mlp.up_proj.weight", | |
| "rel_l2": 0.06489288061857224, | |
| "max_abs": 0.03893229365348816, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.13.self_attn.k_proj.weight", | |
| "rel_l2": 0.06673961132764816, | |
| "max_abs": 0.035400390625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.13.self_attn.o_proj.weight", | |
| "rel_l2": 0.06313878297805786, | |
| "max_abs": 0.0266927108168602, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.13.self_attn.q_proj.weight", | |
| "rel_l2": 0.0662655159831047, | |
| "max_abs": 0.019140630960464478, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.13.self_attn.v_proj.weight", | |
| "rel_l2": 0.05971594527363777, | |
| "max_abs": 0.01181640475988388, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.14.mlp.down_proj.weight", | |
| "rel_l2": 0.0663212463259697, | |
| "max_abs": 0.0442708283662796, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.14.mlp.gate_proj.weight", | |
| "rel_l2": 0.06703805178403854, | |
| "max_abs": 0.03013509139418602, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.14.mlp.up_proj.weight", | |
| "rel_l2": 0.06479182094335556, | |
| "max_abs": 0.0233154296875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.14.self_attn.k_proj.weight", | |
| "rel_l2": 0.06640790402889252, | |
| "max_abs": 0.016796879470348358, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.14.self_attn.o_proj.weight", | |
| "rel_l2": 0.06433359533548355, | |
| "max_abs": 0.03339843451976776, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.14.self_attn.q_proj.weight", | |
| "rel_l2": 0.06542882323265076, | |
| "max_abs": 0.01599934697151184, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.14.self_attn.v_proj.weight", | |
| "rel_l2": 0.06334666907787323, | |
| "max_abs": 0.01175130158662796, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.15.mlp.down_proj.weight", | |
| "rel_l2": 0.06664413213729858, | |
| "max_abs": 0.04335937649011612, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.15.mlp.gate_proj.weight", | |
| "rel_l2": 0.06717315316200256, | |
| "max_abs": 0.03684896230697632, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.15.mlp.up_proj.weight", | |
| "rel_l2": 0.06498843431472778, | |
| "max_abs": 0.02177734300494194, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.15.self_attn.k_proj.weight", | |
| "rel_l2": 0.06741718202829361, | |
| "max_abs": 0.02158202975988388, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.15.self_attn.o_proj.weight", | |
| "rel_l2": 0.06456878036260605, | |
| "max_abs": 0.02031250298023224, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.15.self_attn.q_proj.weight", | |
| "rel_l2": 0.06658957898616791, | |
| "max_abs": 0.02255859225988388, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.15.self_attn.v_proj.weight", | |
| "rel_l2": 0.06370850652456284, | |
| "max_abs": 0.01177978515625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.16.mlp.down_proj.weight", | |
| "rel_l2": 0.06702253222465515, | |
| "max_abs": 0.07962238788604736, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.16.mlp.gate_proj.weight", | |
| "rel_l2": 0.06753792613744736, | |
| "max_abs": 0.03125, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.16.mlp.up_proj.weight", | |
| "rel_l2": 0.06502605974674225, | |
| "max_abs": 0.06015622615814209, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.16.self_attn.k_proj.weight", | |
| "rel_l2": 0.06647730618715286, | |
| "max_abs": 0.01891276240348816, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.16.self_attn.o_proj.weight", | |
| "rel_l2": 0.06474900245666504, | |
| "max_abs": 0.0442708283662796, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.16.self_attn.q_proj.weight", | |
| "rel_l2": 0.06550220400094986, | |
| "max_abs": 0.017382808029651642, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.16.self_attn.v_proj.weight", | |
| "rel_l2": 0.06406065076589584, | |
| "max_abs": 0.011523440480232239, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.17.mlp.down_proj.weight", | |
| "rel_l2": 0.06819935888051987, | |
| "max_abs": 0.04375000298023224, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.17.mlp.gate_proj.weight", | |
| "rel_l2": 0.06768647581338882, | |
| "max_abs": 0.04104818403720856, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.17.mlp.up_proj.weight", | |
| "rel_l2": 0.0658210813999176, | |
| "max_abs": 0.0283203125, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.17.self_attn.k_proj.weight", | |
| "rel_l2": 0.0669577494263649, | |
| "max_abs": 0.01569010317325592, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.17.self_attn.o_proj.weight", | |
| "rel_l2": 0.06509929150342941, | |
| "max_abs": 0.030468732118606567, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.17.self_attn.q_proj.weight", | |
| "rel_l2": 0.06663322448730469, | |
| "max_abs": 0.0167643241584301, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.17.self_attn.v_proj.weight", | |
| "rel_l2": 0.06413859128952026, | |
| "max_abs": 0.01220703125, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.18.mlp.down_proj.weight", | |
| "rel_l2": 0.069343201816082, | |
| "max_abs": 0.03535155951976776, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.18.mlp.gate_proj.weight", | |
| "rel_l2": 0.06887821853160858, | |
| "max_abs": 0.04130859673023224, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.18.mlp.up_proj.weight", | |
| "rel_l2": 0.06599543988704681, | |
| "max_abs": 0.02828776091337204, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.18.self_attn.k_proj.weight", | |
| "rel_l2": 0.06672190129756927, | |
| "max_abs": 0.015380859375, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.18.self_attn.o_proj.weight", | |
| "rel_l2": 0.06514199078083038, | |
| "max_abs": 0.0255533866584301, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.18.self_attn.q_proj.weight", | |
| "rel_l2": 0.06533738970756531, | |
| "max_abs": 0.02151692658662796, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.18.self_attn.v_proj.weight", | |
| "rel_l2": 0.06499006599187851, | |
| "max_abs": 0.011881507933139801, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.19.mlp.down_proj.weight", | |
| "rel_l2": 0.07158460468053818, | |
| "max_abs": 0.03893229365348816, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.19.mlp.gate_proj.weight", | |
| "rel_l2": 0.07148076593875885, | |
| "max_abs": 0.03089192882180214, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.19.mlp.up_proj.weight", | |
| "rel_l2": 0.06830843538045883, | |
| "max_abs": 0.04251302778720856, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.19.self_attn.k_proj.weight", | |
| "rel_l2": 0.06735149025917053, | |
| "max_abs": 0.024804681539535522, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.19.self_attn.o_proj.weight", | |
| "rel_l2": 0.0672638788819313, | |
| "max_abs": 0.035937488079071045, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.19.self_attn.q_proj.weight", | |
| "rel_l2": 0.06672016531229019, | |
| "max_abs": 0.0189208984375, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.19.self_attn.v_proj.weight", | |
| "rel_l2": 0.06629148125648499, | |
| "max_abs": 0.012369789183139801, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.2.mlp.down_proj.weight", | |
| "rel_l2": 0.11238045245409012, | |
| "max_abs": 0.03826497495174408, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.2.mlp.gate_proj.weight", | |
| "rel_l2": 0.07709193229675293, | |
| "max_abs": 0.014973953366279602, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.2.mlp.up_proj.weight", | |
| "rel_l2": 0.07919403910636902, | |
| "max_abs": 0.02610676735639572, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.2.self_attn.k_proj.weight", | |
| "rel_l2": 0.06668715178966522, | |
| "max_abs": 0.0206298828125, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.2.self_attn.o_proj.weight", | |
| "rel_l2": 0.07104453444480896, | |
| "max_abs": 0.0262044295668602, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.2.self_attn.q_proj.weight", | |
| "rel_l2": 0.07025231420993805, | |
| "max_abs": 0.01800130307674408, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.2.self_attn.v_proj.weight", | |
| "rel_l2": 0.06964565068483353, | |
| "max_abs": 0.01171875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.20.mlp.down_proj.weight", | |
| "rel_l2": 0.07081551849842072, | |
| "max_abs": 0.02792968600988388, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.20.mlp.gate_proj.weight", | |
| "rel_l2": 0.0730258896946907, | |
| "max_abs": 0.031494140625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.20.mlp.up_proj.weight", | |
| "rel_l2": 0.06889849156141281, | |
| "max_abs": 0.0322265625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.20.self_attn.k_proj.weight", | |
| "rel_l2": 0.07111072540283203, | |
| "max_abs": 0.0165201798081398, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.20.self_attn.o_proj.weight", | |
| "rel_l2": 0.06483592092990875, | |
| "max_abs": 0.02851562201976776, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.20.self_attn.q_proj.weight", | |
| "rel_l2": 0.06793750822544098, | |
| "max_abs": 0.020117193460464478, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.20.self_attn.v_proj.weight", | |
| "rel_l2": 0.06551762670278549, | |
| "max_abs": 0.012532547116279602, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.21.mlp.down_proj.weight", | |
| "rel_l2": 0.07007616013288498, | |
| "max_abs": 0.050537109375, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.21.mlp.gate_proj.weight", | |
| "rel_l2": 0.07369518280029297, | |
| "max_abs": 0.03430989384651184, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.21.mlp.up_proj.weight", | |
| "rel_l2": 0.06783981621265411, | |
| "max_abs": 0.01787109673023224, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.21.self_attn.k_proj.weight", | |
| "rel_l2": 0.06944476813077927, | |
| "max_abs": 0.015299484133720398, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.21.self_attn.o_proj.weight", | |
| "rel_l2": 0.06496919691562653, | |
| "max_abs": 0.026041656732559204, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.21.self_attn.q_proj.weight", | |
| "rel_l2": 0.06691138446331024, | |
| "max_abs": 0.0213623046875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.21.self_attn.v_proj.weight", | |
| "rel_l2": 0.065667062997818, | |
| "max_abs": 0.015625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.22.mlp.down_proj.weight", | |
| "rel_l2": 0.06848417967557907, | |
| "max_abs": 0.03662109375, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.22.mlp.gate_proj.weight", | |
| "rel_l2": 0.07387233525514603, | |
| "max_abs": 0.0301513671875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.22.mlp.up_proj.weight", | |
| "rel_l2": 0.06605042517185211, | |
| "max_abs": 0.05032552033662796, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.22.self_attn.k_proj.weight", | |
| "rel_l2": 0.06903988867998123, | |
| "max_abs": 0.04098307341337204, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.22.self_attn.o_proj.weight", | |
| "rel_l2": 0.06529656797647476, | |
| "max_abs": 0.0302734375, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.22.self_attn.q_proj.weight", | |
| "rel_l2": 0.06673184782266617, | |
| "max_abs": 0.017968744039535522, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.22.self_attn.v_proj.weight", | |
| "rel_l2": 0.06573918461799622, | |
| "max_abs": 0.01414388045668602, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.23.mlp.down_proj.weight", | |
| "rel_l2": 0.06789179891347885, | |
| "max_abs": 0.0322265625, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.23.mlp.gate_proj.weight", | |
| "rel_l2": 0.07408707588911057, | |
| "max_abs": 0.03004557266831398, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.23.mlp.up_proj.weight", | |
| "rel_l2": 0.06625813990831375, | |
| "max_abs": 0.02068684995174408, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.23.self_attn.k_proj.weight", | |
| "rel_l2": 0.06929145008325577, | |
| "max_abs": 0.0169270820915699, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.23.self_attn.o_proj.weight", | |
| "rel_l2": 0.06800138205289841, | |
| "max_abs": 0.023111969232559204, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.23.self_attn.q_proj.weight", | |
| "rel_l2": 0.06745022535324097, | |
| "max_abs": 0.023046880960464478, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.23.self_attn.v_proj.weight", | |
| "rel_l2": 0.06665196269750595, | |
| "max_abs": 0.01291096955537796, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.24.mlp.down_proj.weight", | |
| "rel_l2": 0.07006856799125671, | |
| "max_abs": 0.03489583730697632, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.24.mlp.gate_proj.weight", | |
| "rel_l2": 0.07322349399328232, | |
| "max_abs": 0.0283203125, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.24.mlp.up_proj.weight", | |
| "rel_l2": 0.06784684956073761, | |
| "max_abs": 0.02001953125, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.24.self_attn.k_proj.weight", | |
| "rel_l2": 0.06916509568691254, | |
| "max_abs": 0.0166015625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.24.self_attn.o_proj.weight", | |
| "rel_l2": 0.06791326403617859, | |
| "max_abs": 0.021158859133720398, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.24.self_attn.q_proj.weight", | |
| "rel_l2": 0.06761031597852707, | |
| "max_abs": 0.01904296875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.24.self_attn.v_proj.weight", | |
| "rel_l2": 0.06186000630259514, | |
| "max_abs": 0.01474609225988388, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.25.mlp.down_proj.weight", | |
| "rel_l2": 0.07028895616531372, | |
| "max_abs": 0.025976553559303284, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.25.mlp.gate_proj.weight", | |
| "rel_l2": 0.07393249124288559, | |
| "max_abs": 0.03590495139360428, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.25.mlp.up_proj.weight", | |
| "rel_l2": 0.06790996342897415, | |
| "max_abs": 0.02373046800494194, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.25.self_attn.k_proj.weight", | |
| "rel_l2": 0.06831444054841995, | |
| "max_abs": 0.015625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.25.self_attn.o_proj.weight", | |
| "rel_l2": 0.06747766584157944, | |
| "max_abs": 0.0126953125, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.25.self_attn.q_proj.weight", | |
| "rel_l2": 0.06647656112909317, | |
| "max_abs": 0.01902668923139572, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.25.self_attn.v_proj.weight", | |
| "rel_l2": 0.06351126730442047, | |
| "max_abs": 0.011132806539535522, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.26.mlp.down_proj.weight", | |
| "rel_l2": 0.07111111283302307, | |
| "max_abs": 0.0286458320915699, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.26.mlp.gate_proj.weight", | |
| "rel_l2": 0.07467159628868103, | |
| "max_abs": 0.03746744990348816, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.26.mlp.up_proj.weight", | |
| "rel_l2": 0.06867961585521698, | |
| "max_abs": 0.03367512673139572, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.26.self_attn.k_proj.weight", | |
| "rel_l2": 0.07186003774404526, | |
| "max_abs": 0.01503906399011612, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.26.self_attn.o_proj.weight", | |
| "rel_l2": 0.06553354859352112, | |
| "max_abs": 0.014322921633720398, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.26.self_attn.q_proj.weight", | |
| "rel_l2": 0.06843607127666473, | |
| "max_abs": 0.017822265625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.26.self_attn.v_proj.weight", | |
| "rel_l2": 0.06072765961289406, | |
| "max_abs": 0.01081949844956398, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.27.mlp.down_proj.weight", | |
| "rel_l2": 0.07197169959545135, | |
| "max_abs": 0.025195300579071045, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.27.mlp.gate_proj.weight", | |
| "rel_l2": 0.0748187005519867, | |
| "max_abs": 0.02776692807674408, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.27.mlp.up_proj.weight", | |
| "rel_l2": 0.06902790814638138, | |
| "max_abs": 0.02871093899011612, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.27.self_attn.k_proj.weight", | |
| "rel_l2": 0.06958119571208954, | |
| "max_abs": 0.01507568359375, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.27.self_attn.o_proj.weight", | |
| "rel_l2": 0.06719069182872772, | |
| "max_abs": 0.0196940079331398, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.27.self_attn.q_proj.weight", | |
| "rel_l2": 0.06820857524871826, | |
| "max_abs": 0.017415359616279602, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.27.self_attn.v_proj.weight", | |
| "rel_l2": 0.06324808299541473, | |
| "max_abs": 0.01276041567325592, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.28.mlp.down_proj.weight", | |
| "rel_l2": 0.0742034986615181, | |
| "max_abs": 0.03821614384651184, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.28.mlp.gate_proj.weight", | |
| "rel_l2": 0.07764001935720444, | |
| "max_abs": 0.0286865234375, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.28.mlp.up_proj.weight", | |
| "rel_l2": 0.07109709084033966, | |
| "max_abs": 0.04168294370174408, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.28.self_attn.k_proj.weight", | |
| "rel_l2": 0.06993237882852554, | |
| "max_abs": 0.01386718824505806, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.28.self_attn.o_proj.weight", | |
| "rel_l2": 0.06693819165229797, | |
| "max_abs": 0.018880203366279602, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.28.self_attn.q_proj.weight", | |
| "rel_l2": 0.06869757920503616, | |
| "max_abs": 0.01640625298023224, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.28.self_attn.v_proj.weight", | |
| "rel_l2": 0.06167382374405861, | |
| "max_abs": 0.01193033903837204, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.29.mlp.down_proj.weight", | |
| "rel_l2": 0.07363142818212509, | |
| "max_abs": 0.025976553559303284, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.29.mlp.gate_proj.weight", | |
| "rel_l2": 0.07935639470815659, | |
| "max_abs": 0.0386556014418602, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.29.mlp.up_proj.weight", | |
| "rel_l2": 0.07232704758644104, | |
| "max_abs": 0.02382812649011612, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.29.self_attn.k_proj.weight", | |
| "rel_l2": 0.0734124481678009, | |
| "max_abs": 0.01712239533662796, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.29.self_attn.o_proj.weight", | |
| "rel_l2": 0.06708438694477081, | |
| "max_abs": 0.016666650772094727, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.29.self_attn.q_proj.weight", | |
| "rel_l2": 0.07113268226385117, | |
| "max_abs": 0.020182311534881592, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.29.self_attn.v_proj.weight", | |
| "rel_l2": 0.06106225401163101, | |
| "max_abs": 0.01533203199505806, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.3.mlp.down_proj.weight", | |
| "rel_l2": 0.08152986317873001, | |
| "max_abs": 0.03616536408662796, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.3.mlp.gate_proj.weight", | |
| "rel_l2": 0.07240079343318939, | |
| "max_abs": 0.02233073115348816, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.3.mlp.up_proj.weight", | |
| "rel_l2": 0.07463279366493225, | |
| "max_abs": 0.02154947817325592, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.3.self_attn.k_proj.weight", | |
| "rel_l2": 0.06854531913995743, | |
| "max_abs": 0.018033847212791443, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.3.self_attn.o_proj.weight", | |
| "rel_l2": 0.06809478998184204, | |
| "max_abs": 0.0244140625, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.3.self_attn.q_proj.weight", | |
| "rel_l2": 0.071794293820858, | |
| "max_abs": 0.02353515475988388, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.3.self_attn.v_proj.weight", | |
| "rel_l2": 0.06851097196340561, | |
| "max_abs": 0.010498046875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.30.mlp.down_proj.weight", | |
| "rel_l2": 0.07187923043966293, | |
| "max_abs": 0.03074544295668602, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.30.mlp.gate_proj.weight", | |
| "rel_l2": 0.07799259573221207, | |
| "max_abs": 0.0341796875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.30.mlp.up_proj.weight", | |
| "rel_l2": 0.07077936828136444, | |
| "max_abs": 0.02412109076976776, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.30.self_attn.k_proj.weight", | |
| "rel_l2": 0.0749228298664093, | |
| "max_abs": 0.01793619990348816, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.30.self_attn.o_proj.weight", | |
| "rel_l2": 0.0694289281964302, | |
| "max_abs": 0.016666650772094727, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.30.self_attn.q_proj.weight", | |
| "rel_l2": 0.07082075625658035, | |
| "max_abs": 0.02438151091337204, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.30.self_attn.v_proj.weight", | |
| "rel_l2": 0.061844345182180405, | |
| "max_abs": 0.01582030951976776, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.31.mlp.down_proj.weight", | |
| "rel_l2": 0.06976475566625595, | |
| "max_abs": 0.03763020038604736, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.31.mlp.gate_proj.weight", | |
| "rel_l2": 0.07731909304857254, | |
| "max_abs": 0.04296875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.31.mlp.up_proj.weight", | |
| "rel_l2": 0.07021760940551758, | |
| "max_abs": 0.0296630859375, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.31.self_attn.k_proj.weight", | |
| "rel_l2": 0.07398602366447449, | |
| "max_abs": 0.01609700545668602, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.31.self_attn.o_proj.weight", | |
| "rel_l2": 0.06957647204399109, | |
| "max_abs": 0.02086588740348816, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.31.self_attn.q_proj.weight", | |
| "rel_l2": 0.06946918368339539, | |
| "max_abs": 0.02080078423023224, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.31.self_attn.v_proj.weight", | |
| "rel_l2": 0.06264778971672058, | |
| "max_abs": 0.01165364496409893, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.32.mlp.down_proj.weight", | |
| "rel_l2": 0.06731897592544556, | |
| "max_abs": 0.037890613079071045, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.32.mlp.gate_proj.weight", | |
| "rel_l2": 0.07542521506547928, | |
| "max_abs": 0.0341796875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.32.mlp.up_proj.weight", | |
| "rel_l2": 0.06934364885091782, | |
| "max_abs": 0.03136393427848816, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.32.self_attn.k_proj.weight", | |
| "rel_l2": 0.07342707365751266, | |
| "max_abs": 0.01640625298023224, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.32.self_attn.o_proj.weight", | |
| "rel_l2": 0.07076826691627502, | |
| "max_abs": 0.02542317658662796, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.32.self_attn.q_proj.weight", | |
| "rel_l2": 0.06907843798398972, | |
| "max_abs": 0.02051595225930214, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.32.self_attn.v_proj.weight", | |
| "rel_l2": 0.06290274113416672, | |
| "max_abs": 0.01373291015625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.33.mlp.down_proj.weight", | |
| "rel_l2": 0.06806037575006485, | |
| "max_abs": 0.036376953125, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.33.mlp.gate_proj.weight", | |
| "rel_l2": 0.0751243457198143, | |
| "max_abs": 0.03606770932674408, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.33.mlp.up_proj.weight", | |
| "rel_l2": 0.06909118592739105, | |
| "max_abs": 0.024511724710464478, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.33.self_attn.k_proj.weight", | |
| "rel_l2": 0.07059690356254578, | |
| "max_abs": 0.013476565480232239, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.33.self_attn.o_proj.weight", | |
| "rel_l2": 0.07009471207857132, | |
| "max_abs": 0.028906241059303284, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.33.self_attn.q_proj.weight", | |
| "rel_l2": 0.06914056837558746, | |
| "max_abs": 0.0238037109375, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.33.self_attn.v_proj.weight", | |
| "rel_l2": 0.06516322493553162, | |
| "max_abs": 0.012011721730232239, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.34.mlp.down_proj.weight", | |
| "rel_l2": 0.09997338056564331, | |
| "max_abs": 0.04296875, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.34.mlp.gate_proj.weight", | |
| "rel_l2": 0.07913520932197571, | |
| "max_abs": 0.03585612028837204, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.34.mlp.up_proj.weight", | |
| "rel_l2": 0.08036722242832184, | |
| "max_abs": 0.0294596366584301, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.34.self_attn.k_proj.weight", | |
| "rel_l2": 0.07352534681558609, | |
| "max_abs": 0.018310546875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.34.self_attn.o_proj.weight", | |
| "rel_l2": 0.07350429147481918, | |
| "max_abs": 0.02255859225988388, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.34.self_attn.q_proj.weight", | |
| "rel_l2": 0.07281963527202606, | |
| "max_abs": 0.01930338516831398, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.34.self_attn.v_proj.weight", | |
| "rel_l2": 0.07139786332845688, | |
| "max_abs": 0.013964839279651642, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.35.mlp.down_proj.weight", | |
| "rel_l2": 0.0817723423242569, | |
| "max_abs": 0.03785806894302368, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.35.mlp.gate_proj.weight", | |
| "rel_l2": 0.07454026490449905, | |
| "max_abs": 0.04270832985639572, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.35.mlp.up_proj.weight", | |
| "rel_l2": 0.07056299597024918, | |
| "max_abs": 0.04303385317325592, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.35.self_attn.k_proj.weight", | |
| "rel_l2": 0.0727466270327568, | |
| "max_abs": 0.0247395820915699, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.35.self_attn.o_proj.weight", | |
| "rel_l2": 0.07178165018558502, | |
| "max_abs": 0.03512369841337204, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.35.self_attn.q_proj.weight", | |
| "rel_l2": 0.07691565155982971, | |
| "max_abs": 0.01951497420668602, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.35.self_attn.v_proj.weight", | |
| "rel_l2": 0.06240251287817955, | |
| "max_abs": 0.01171875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.4.mlp.down_proj.weight", | |
| "rel_l2": 0.08333507180213928, | |
| "max_abs": 0.028645843267440796, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.4.mlp.gate_proj.weight", | |
| "rel_l2": 0.07108590006828308, | |
| "max_abs": 0.0191650390625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.4.mlp.up_proj.weight", | |
| "rel_l2": 0.07116637378931046, | |
| "max_abs": 0.016894526779651642, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.4.self_attn.k_proj.weight", | |
| "rel_l2": 0.0647963210940361, | |
| "max_abs": 0.03131510317325592, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.4.self_attn.o_proj.weight", | |
| "rel_l2": 0.06481703370809555, | |
| "max_abs": 0.027734369039535522, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.4.self_attn.q_proj.weight", | |
| "rel_l2": 0.06910184770822525, | |
| "max_abs": 0.0208333358168602, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.4.self_attn.v_proj.weight", | |
| "rel_l2": 0.06265527755022049, | |
| "max_abs": 0.010449215769767761, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.5.mlp.down_proj.weight", | |
| "rel_l2": 0.06850583106279373, | |
| "max_abs": 0.0338541716337204, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.5.mlp.gate_proj.weight", | |
| "rel_l2": 0.06662628054618835, | |
| "max_abs": 0.03688150644302368, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.5.mlp.up_proj.weight", | |
| "rel_l2": 0.06648511439561844, | |
| "max_abs": 0.02688802033662796, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.5.self_attn.k_proj.weight", | |
| "rel_l2": 0.06616631895303726, | |
| "max_abs": 0.019856765866279602, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.5.self_attn.o_proj.weight", | |
| "rel_l2": 0.06722407042980194, | |
| "max_abs": 0.028385430574417114, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.5.self_attn.q_proj.weight", | |
| "rel_l2": 0.06911922246217728, | |
| "max_abs": 0.0201416015625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.5.self_attn.v_proj.weight", | |
| "rel_l2": 0.06332346796989441, | |
| "max_abs": 0.01103515550494194, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.6.mlp.down_proj.weight", | |
| "rel_l2": 0.06818147748708725, | |
| "max_abs": 0.03610025346279144, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.6.mlp.gate_proj.weight", | |
| "rel_l2": 0.06727603822946548, | |
| "max_abs": 0.0208333320915699, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.6.mlp.up_proj.weight", | |
| "rel_l2": 0.06784625351428986, | |
| "max_abs": 0.029052734375, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.6.self_attn.k_proj.weight", | |
| "rel_l2": 0.06962763518095016, | |
| "max_abs": 0.019775390625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.6.self_attn.o_proj.weight", | |
| "rel_l2": 0.06578625738620758, | |
| "max_abs": 0.034505218267440796, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.6.self_attn.q_proj.weight", | |
| "rel_l2": 0.07230403274297714, | |
| "max_abs": 0.03701172024011612, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.6.self_attn.v_proj.weight", | |
| "rel_l2": 0.06438400596380234, | |
| "max_abs": 0.0144856758415699, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.7.mlp.down_proj.weight", | |
| "rel_l2": 0.06753715872764587, | |
| "max_abs": 0.0402018278837204, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.7.mlp.gate_proj.weight", | |
| "rel_l2": 0.06714757531881332, | |
| "max_abs": 0.02874349057674408, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.7.mlp.up_proj.weight", | |
| "rel_l2": 0.06696663051843643, | |
| "max_abs": 0.02706705778837204, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.7.self_attn.k_proj.weight", | |
| "rel_l2": 0.06627088040113449, | |
| "max_abs": 0.02223307266831398, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.7.self_attn.o_proj.weight", | |
| "rel_l2": 0.0640726387500763, | |
| "max_abs": 0.02845052257180214, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.7.self_attn.q_proj.weight", | |
| "rel_l2": 0.07050060480833054, | |
| "max_abs": 0.018945321440696716, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.7.self_attn.v_proj.weight", | |
| "rel_l2": 0.06026323512196541, | |
| "max_abs": 0.0105794258415699, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.8.mlp.down_proj.weight", | |
| "rel_l2": 0.06675248593091965, | |
| "max_abs": 0.05903320014476776, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.8.mlp.gate_proj.weight", | |
| "rel_l2": 0.06716714054346085, | |
| "max_abs": 0.022070318460464478, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.8.mlp.up_proj.weight", | |
| "rel_l2": 0.06610891222953796, | |
| "max_abs": 0.025390625, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.8.self_attn.k_proj.weight", | |
| "rel_l2": 0.06527405977249146, | |
| "max_abs": 0.02070312574505806, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.8.self_attn.o_proj.weight", | |
| "rel_l2": 0.06378088146448135, | |
| "max_abs": 0.024316415190696716, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.8.self_attn.q_proj.weight", | |
| "rel_l2": 0.06827351450920105, | |
| "max_abs": 0.018457040190696716, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.8.self_attn.v_proj.weight", | |
| "rel_l2": 0.060887426137924194, | |
| "max_abs": 0.00989583134651184, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.9.mlp.down_proj.weight", | |
| "rel_l2": 0.06713589280843735, | |
| "max_abs": 0.032958984375, | |
| "padded_cols": 9728 | |
| }, | |
| { | |
| "name": "body.layers.9.mlp.gate_proj.weight", | |
| "rel_l2": 0.06769132614135742, | |
| "max_abs": 0.02706705778837204, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.9.mlp.up_proj.weight", | |
| "rel_l2": 0.06665731221437454, | |
| "max_abs": 0.02470703423023224, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.9.self_attn.k_proj.weight", | |
| "rel_l2": 0.06489330530166626, | |
| "max_abs": 0.037841796875, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.9.self_attn.o_proj.weight", | |
| "rel_l2": 0.06393518298864365, | |
| "max_abs": 0.0377604216337204, | |
| "padded_cols": 4096 | |
| }, | |
| { | |
| "name": "body.layers.9.self_attn.q_proj.weight", | |
| "rel_l2": 0.06735270470380783, | |
| "max_abs": 0.026953130960464478, | |
| "padded_cols": 2560 | |
| }, | |
| { | |
| "name": "body.layers.9.self_attn.v_proj.weight", | |
| "rel_l2": 0.060543693602085114, | |
| "max_abs": 0.01079101487994194, | |
| "padded_cols": 2560 | |
| } | |
| ] | |
| } | |