{
  "model_name": "emma-5",
  "model_type": "gpt",
  "architecture": "decoder-only-transformer-gqa",
  "vocab_size": 50000,
  "hidden_size": 1280,
  "num_hidden_layers": 28,
  "num_attention_heads": 16,
  "num_kv_heads": 4,
  "intermediate_size": 3456,
  "context_length": 2048,
  "rope_theta": 10000.0,
  "norm_type": "rmsnorm",
  "activation": "swiglu",
  "tokenizer": "sentencepiece",
  "tied_embeddings": true,
  "alignment": "SFT",
  "gpu_memory_limit_gb": 14.0,
  "onnx_opset": 18
}