| { |
| "architectures": [ |
| "MistralForCausalLM" |
| ], |
| "attention_dropout": 0.0, |
| "bos_token_id": 1, |
| "eos_token_id": 2, |
| "head_dim": 128, |
| "hidden_act": "silu", |
| "hidden_size": 5120, |
| "initializer_range": 0.02, |
| "intermediate_size": 14336, |
| "max_position_embeddings": 131072, |
| "model_type": "mistral", |
| "num_attention_heads": 32, |
| "num_hidden_layers": 40, |
| "num_key_value_heads": 8, |
| "pruning_info": { |
| "importance_metric": "magnitude", |
| "layer_stats": { |
| "layers.0.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.0.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.0.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.1.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.1.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.1.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.10.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.10.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.10.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.11.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.11.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.11.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.12.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.12.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.12.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.13.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.13.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.13.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.14.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.14.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.14.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.15.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.15.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.15.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.16.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.16.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.16.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.17.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.17.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.17.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.18.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.18.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.18.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.19.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.19.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.19.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.2.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.2.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.2.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.20.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.20.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.20.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.21.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.21.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.21.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.22.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.22.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.22.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.23.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.23.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.23.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.24.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.24.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.24.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.25.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.25.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.25.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.26.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.26.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.26.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.27.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.27.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.27.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.28.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.28.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.28.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.29.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.29.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.29.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.3.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.3.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.3.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.30.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.30.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.30.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.31.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.31.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.31.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.32.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.32.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.32.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.33.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.33.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.33.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.34.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.34.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.34.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.35.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.35.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.35.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.36.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.36.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.36.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.37.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.37.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.37.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.38.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.38.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.38.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.39.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.39.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.39.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.4.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.4.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.4.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.5.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.5.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.5.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.6.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.6.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.6.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.7.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.7.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.7.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.8.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.8.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.8.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.9.mlp.down_proj": { |
| "original": 5120, |
| "pruned": 4096, |
| "ratio": 0.19999999999999996, |
| "removed": 1024 |
| }, |
| "layers.9.mlp.gate_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| }, |
| "layers.9.mlp.up_proj": { |
| "original": 14336, |
| "pruned": 11469, |
| "ratio": 0.1999860491071429, |
| "removed": 2867 |
| } |
| }, |
| "pruned": true, |
| "pruning_ratio": 0.2 |
| }, |
| "rms_norm_eps": 1e-05, |
| "rope_theta": 1000000.0, |
| "sliding_window": null, |
| "tie_word_embeddings": false, |
| "torch_dtype": "bfloat16", |
| "transformers_version": "4.55.3", |
| "use_cache": true, |
| "vocab_size": 131072 |
| } |
|
|