{ "model_name": "hf_model", "architecture": "lfm2", "hidden_size": 1024, "num_hidden_layers": 16, "num_attention_heads": 16, "num_key_value_heads": 8, "head_dim": 64, "vocab_size": 65536, "context_length": 2048, "rms_norm_eps": 1e-05, "bos_token_id": 1, "eos_token_id": 7, "quantization": "int4", "compute_units": "ALL", "parts": { "model": "model.mlpackage" }, "tokenizer_repo": "hf_model", "lfm2_conv_l_pad": 3 }