{
  "architecture": "WireNative",
  "n_groups": 7,
  "n_harmonics": 64,
  "n_layers": 8,
  "d_model": 896,
  "n_kan_coeffs": 4,
  "vocab_size": 256,
  "seq_len": 256,
  "training": {
    "step": 5000,
    "bpb": 3.086578
  }
}
{
  "architecture": "WireNative",
  "n_groups": 7,
  "n_harmonics": 64,
  "n_layers": 8,
  "d_model": 896,
  "n_kan_coeffs": 4,
  "vocab_size": 256,
  "seq_len": 256,
  "training": {
    "step": 5000,
    "bpb": 3.086578
  }
}