{
  "decoder_dim": 256,
  "decoder_layers": 4,
  "decoder_heads": 4,
  "max_audio_tokens": 500,
  "text_vocab_size": 128257,
  "temperature": 1.0,
  "top_k": 50
}
{
  "decoder_dim": 256,
  "decoder_layers": 4,
  "decoder_heads": 4,
  "max_audio_tokens": 500,
  "text_vocab_size": 128257,
  "temperature": 1.0,
  "top_k": 50
}