{ "producer": { "name": "modelopt", "version": "0.37.0" }, "architecture": "Phi3ForCausalLM", "dtype": "bfloat16", "logits_dtype": "float16", "num_hidden_layers": 32, "num_attention_heads": 24, "num_key_value_heads": 8, "hidden_size": 3072, "norm_epsilon": 1e-05, "vocab_size": 200064, "max_position_embeddings": 131072, "hidden_act": "swiglu", "use_parallel_embedding": true, "embedding_sharding_dim": 0, "head_size": 128, "intermediate_size": 8192, "position_embedding_type": "long_rope", "share_embedding_table": false, "residual_mlp": false, "bias": false, "rotary_pct": 0.75, "rank": 0, "decoder": "phi3", "rmsnorm": true, "lm_head_bias": false, "rotary_base": 10000.0, "rotary_scaling": null, "runtime_defaults": null, "mapping": { "world_size": 1, "gpus_per_node": 8, "cp_size": 1, "tp_size": 1, "pp_size": 1, "moe_tp_size": 1, "moe_cluster_size": 1, "moe_ep_size": 1, "attn_tp_size": 1, "attn_cp_size": 1, "cp_config": {}, "enable_attention_dp": false, "enable_lm_head_tp_in_adp": false }, "quantization": { "quant_algo": "FP8", "kv_cache_quant_algo": "FP8", "group_size": 128, "smoothquant_val": 0.5, "clamp_val": null, "use_meta_recipe": false, "has_zero_point": false, "pre_quant_scale": false, "exclude_modules": [ "lm_head" ], "mamba_ssm_cache_dtype": null }, "qk_layernorm": false, "rotary_embedding_dim": 96, "tie_word_embeddings": true, "original_max_position_embeddings": 4096, "longrope_scaling_short_factors": [ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0 ], "longrope_scaling_long_factors": [ 1, 1.118320672, 1.250641126, 1.398617824, 1.564103225, 1.74916897, 1.956131817, 2.187582649, 2.446418898, 2.735880826, 3.059592084, 3.421605075, 3.826451687, 4.279200023, 4.785517845, 5.351743533, 5.984965424, 6.693110555, 7.485043894, 8.370679318, 9.36110372, 10.4687158, 11.70738129, 13.09260651, 14.64173252, 16.37415215, 18.31155283, 20.47818807, 22.90118105, 25.61086418, 28.64115884, 32.03, 32.1, 32.13, 32.23, 32.6, 32.61, 32.64, 32.66, 32.7, 32.71, 32.93, 32.97, 33.28, 33.49, 33.5, 44.16, 47.77 ], "model_type": "phi3" }