{
  "num_heads": 1,
  "attention_dim": 256,
  "vocab_size": 50260,
  "num_blocks": 4,
  "ff_dim": 768,
  "dropout_rate": 0.1,
  "possible_opt_path": "",
  "max_len": 2048,
  "attn_chunks": 1,
  "use_fash_attention": false
}
{
  "num_heads": 1,
  "attention_dim": 256,
  "vocab_size": 50260,
  "num_blocks": 4,
  "ff_dim": 768,
  "dropout_rate": 0.1,
  "possible_opt_path": "",
  "max_len": 2048,
  "attn_chunks": 1,
  "use_fash_attention": false
}