| { | |
| "vocab_size": 6000, | |
| "max_seq_len": 512, | |
| "num_layers": 6, | |
| "hidden_dim": 384, | |
| "num_heads": 6, | |
| "ffn_dim": 768, | |
| "dropout": 0.1, | |
| "rope_theta": 10000.0, | |
| "step": 2060, | |
| "quantization": { | |
| "bits": 4, | |
| "group_size": 32 | |
| } | |
| } |
| { | |
| "vocab_size": 6000, | |
| "max_seq_len": 512, | |
| "num_layers": 6, | |
| "hidden_dim": 384, | |
| "num_heads": 6, | |
| "ffn_dim": 768, | |
| "dropout": 0.1, | |
| "rope_theta": 10000.0, | |
| "step": 2060, | |
| "quantization": { | |
| "bits": 4, | |
| "group_size": 32 | |
| } | |
| } |