test-7.6B-base / configuration.py
michaelbzhu's picture
Upload model
6bd3c24 verified
from transformers import PretrainedConfig
class MBZTestConfig(PretrainedConfig):
    """Configuration holder for the ``mbz-test`` model type.

    Records five integer hyperparameters as instance attributes and hands
    every remaining keyword argument to ``PretrainedConfig.__init__``.

    Args:
        n_layers: Stored as ``self.n_layers`` (presumably the number of
            layers in the model -- confirm against the modeling code).
        d_model: Stored as ``self.d_model`` (presumably the model/hidden
            width -- confirm against the modeling code).
        n_heads: Stored as ``self.n_heads`` (presumably the attention head
            count -- confirm against the modeling code).
        n_vocab: Stored as ``self.n_vocab`` (presumably the vocabulary
            size -- confirm against the tokenizer in use).
        d_head: Stored as ``self.d_head`` (presumably the per-head
            width -- confirm against the modeling code).
        **kwargs: Passed through unchanged to the parent constructor.

    Note:
        With the defaults, ``n_heads * d_head == d_model`` (32 * 128 == 4096).
        Nothing in this class enforces that relation for other values.
    """

    # Identifier string for this configuration class.
    model_type = "mbz-test"

    def __init__(
        self,
        n_layers: int = 36,
        d_model: int = 4096,
        n_heads: int = 32,
        n_vocab: int = 50257,
        d_head: int = 128,
        **kwargs,
    ) -> None:
        # Depth and vocabulary settings.
        self.n_layers = n_layers
        self.n_vocab = n_vocab

        # Width settings.
        self.d_model = d_model
        self.n_heads = n_heads
        self.d_head = d_head

        # The parent constructor runs last, after the attributes above are
        # set, and receives only the keyword arguments not consumed here.
        super().__init__(**kwargs)