{
  "architectures": [
    "BT4"
  ],
  "auto_map": {
    "AutoConfig": "model.BT4Config",
    "AutoModel": "model.BT4"
  },
  "dropout_rate": 0.0,
  "dtype": "float32",
  "embedding_dense_sz": 512,
  "embedding_size": 1024,
  "encoder_d_model": 1024,
  "encoder_dff": 1536,
  "encoder_heads": 32,
  "encoder_layers": 15,
  "model_type": "bt4",
  "pol_embedding_size": 1024,
  "policy_d_model": 1024,
  "smol_activation": "swish",
  "smol_gen_sz": 256,
  "smol_hidden_channels": 32,
  "smol_hidden_sz": 256,
  "transformers_version": "4.57.1",
  "use_smolgen": true,
  "val_embedding_size": 128
}