{
  "architectures": [
    "BucketMemoryModel"
  ],
  "auto_map": {
    "AutoConfig": "bucket_memory_model.BucketMemoryConfig",
    "AutoModel": "bucket_memory_model.BucketMemoryModel"
  },
  "d_model": 1024,
  "dropout": 0.1,
  "max_bucket_size": 32,
  "max_seq_length": 1024,
  "min_bucket_size": 1,
  "model_type": "bucket-memory-model3",
  "num_attention_heads": 8,
  "num_buckets": 8,
  "num_layers": 12,
  "torch_dtype": "float32",
  "transformers_version": "4.50.2",
  "use_flash_attention": true,
  "vocab_size": 30522
}