{ "model_name": "emma-5", "model_type": "gpt", "architecture": "decoder-only-transformer-gqa", "vocab_size": 50000, "hidden_size": 1280, "num_hidden_layers": 28, "num_attention_heads": 16, "num_kv_heads": 4, "intermediate_size": 3456, "context_length": 2048, "rope_theta": 10000.0, "norm_type": "rmsnorm", "activation": "swiglu", "tokenizer": "sentencepiece", "tied_embeddings": true, "alignment": "SFT", "gpu_memory_limit_gb": 14.0, "onnx_opset": 18 }