| { | |
| "tok_emb.weight": { | |
| "scale": 3.5722721575251916e-05, | |
| "nbits": 18, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "pos_emb.weight": { | |
| "scale": 3.314935944296658e-05, | |
| "nbits": 18, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.0.norm1.weight": { | |
| "scale": 1.3538360433878532e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.0.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.0.attn.W_qkv.weight": { | |
| "scale": 0.0013009633219017568, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.0.attn.W_o.weight": { | |
| "scale": 0.0009806638006958249, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.0.norm2.weight": { | |
| "scale": 1.3978162281289483e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.0.ff.fc1.weight": { | |
| "scale": 0.0012522846309088159, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.0.ff.fc2.weight": { | |
| "scale": 0.0008591893586456118, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.1.norm1.weight": { | |
| "scale": 1.3831941095351961e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.1.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.1.attn.W_qkv.weight": { | |
| "scale": 0.001282494329923795, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.1.attn.W_o.weight": { | |
| "scale": 0.0011245226614926556, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.1.norm2.weight": { | |
| "scale": 1.4735743036467565e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.1.ff.fc1.weight": { | |
| "scale": 0.001335447659535746, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.1.ff.fc2.weight": { | |
| "scale": 0.0009407425338697058, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.2.norm1.weight": { | |
| "scale": 1.4124889373715176e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.2.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.2.attn.W_qkv.weight": { | |
| "scale": 0.001387487442367734, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.2.attn.W_o.weight": { | |
| "scale": 0.0012036952295510599, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.2.norm2.weight": { | |
| "scale": 1.4793962073005056e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.2.ff.fc1.weight": { | |
| "scale": 0.0015438962488531877, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.2.ff.fc2.weight": { | |
| "scale": 0.0010037684617888083, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.3.norm1.weight": { | |
| "scale": 1.3520645180278738e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.3.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.3.attn.W_qkv.weight": { | |
| "scale": 0.0011730166719523753, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.3.attn.W_o.weight": { | |
| "scale": 0.0010373295140886681, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.3.norm2.weight": { | |
| "scale": 1.3207615540723584e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.3.ff.fc1.weight": { | |
| "scale": 0.0011169617888365016, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.3.ff.fc2.weight": { | |
| "scale": 0.0008502002038224287, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.4.norm1.weight": { | |
| "scale": 1.3003884439983394e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.4.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.4.attn.W_qkv.weight": { | |
| "scale": 0.001148089610578582, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.4.attn.W_o.weight": { | |
| "scale": 0.0010316128654612143, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.4.norm2.weight": { | |
| "scale": 1.3064186788070484e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.4.ff.fc1.weight": { | |
| "scale": 0.0011656039895843145, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.4.ff.fc2.weight": { | |
| "scale": 0.0006925634595222173, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.5.norm1.weight": { | |
| "scale": 1.302203312470367e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.5.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.5.attn.W_qkv.weight": { | |
| "scale": 0.0012216476088303093, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.5.attn.W_o.weight": { | |
| "scale": 0.0009262990260556739, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.5.norm2.weight": { | |
| "scale": 1.308989564840049e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.5.ff.fc1.weight": { | |
| "scale": 0.0009419608504622752, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.5.ff.fc2.weight": { | |
| "scale": 0.0005326317604001864, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "norm_f.weight": { | |
| "scale": 1.1641727667871719e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "lm_head.weight": { | |
| "scale": 0.036867817634565696, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| } | |
| } |