| { | |
| "tok_emb.weight": { | |
| "scale": 3.5358746294648986e-05, | |
| "nbits": 18, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "pos_emb.weight": { | |
| "scale": 3.1597513173472055e-05, | |
| "nbits": 18, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.0.norm1.weight": { | |
| "scale": 1.3209595113021395e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.0.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.0.attn.W_qkv.weight": { | |
| "scale": 0.0015000347395450861, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.0.attn.W_o.weight": { | |
| "scale": 0.0013187960225635438, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.0.norm2.weight": { | |
| "scale": 1.4181934593513262e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.0.ff.fc1.weight": { | |
| "scale": 0.001667314940443264, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.0.ff.fc2.weight": { | |
| "scale": 0.0010553032477878962, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.1.norm1.weight": { | |
| "scale": 1.3827945002529675e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.1.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.1.attn.W_qkv.weight": { | |
| "scale": 0.001731296771986353, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.1.attn.W_o.weight": { | |
| "scale": 0.001110142454280703, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.1.norm2.weight": { | |
| "scale": 1.5427329995566648e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.1.ff.fc1.weight": { | |
| "scale": 0.0015605155021994883, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.1.ff.fc2.weight": { | |
| "scale": 0.0009985333435986736, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.2.norm1.weight": { | |
| "scale": 1.3975247634639942e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.2.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.2.attn.W_qkv.weight": { | |
| "scale": 0.001613255991603521, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.2.attn.W_o.weight": { | |
| "scale": 0.0013360020531313437, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.2.norm2.weight": { | |
| "scale": 1.5509284004478898e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.2.ff.fc1.weight": { | |
| "scale": 0.0015022808255981085, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.2.ff.fc2.weight": { | |
| "scale": 0.0009525172085143262, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.3.norm1.weight": { | |
| "scale": 1.3970346310264385e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.3.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.3.attn.W_qkv.weight": { | |
| "scale": 0.0015125466696728684, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.3.attn.W_o.weight": { | |
| "scale": 0.001131701501228753, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.3.norm2.weight": { | |
| "scale": 1.4962701782008706e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.3.ff.fc1.weight": { | |
| "scale": 0.001568063116342139, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.3.ff.fc2.weight": { | |
| "scale": 0.0009154184797486733, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.4.norm1.weight": { | |
| "scale": 1.3366053799916156e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.4.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.4.attn.W_qkv.weight": { | |
| "scale": 0.0015748838588816724, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.4.attn.W_o.weight": { | |
| "scale": 0.0011705895426574466, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.4.norm2.weight": { | |
| "scale": 1.3441016067475046e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.4.ff.fc1.weight": { | |
| "scale": 0.0013426361204940316, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.4.ff.fc2.weight": { | |
| "scale": 0.000807040222410217, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.5.norm1.weight": { | |
| "scale": 1.3428439459552842e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.5.attn.mask": { | |
| "scale": 0.007874015826771653, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.5.attn.W_qkv.weight": { | |
| "scale": 0.0014554336867802537, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.5.attn.W_o.weight": { | |
| "scale": 0.0010917134725072063, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.5.norm2.weight": { | |
| "scale": 1.296776754841924e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "blocks.5.ff.fc1.weight": { | |
| "scale": 0.0011314953489435751, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "blocks.5.ff.fc2.weight": { | |
| "scale": 0.0006560393641183508, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| }, | |
| "norm_f.weight": { | |
| "scale": 1.1689558568374033e-07, | |
| "nbits": 24, | |
| "dtype": "int32", | |
| "emulated": true | |
| }, | |
| "lm_head.weight": { | |
| "scale": 0.03649217508335384, | |
| "nbits": 8, | |
| "dtype": "int8", | |
| "emulated": false | |
| } | |
| } |