"""
Hugging Face config class for MINDI 1.0 420M.
"""
from transformers import PretrainedConfig
class MindiConfig(PretrainedConfig):
    """Configuration container for models registered under ``model_type = "mindi"``.

    Every constructor argument is stored unchanged as an attribute of the same
    name. The special-token ids and any extra keyword arguments are forwarded
    to ``PretrainedConfig.__init__``.

    The parameter descriptions below follow the conventional meaning of these
    names; the model code that consumes them is not part of this file.

    Args:
        vocab_size: Number of entries in the token vocabulary.
        max_seq_len: Maximum sequence length.
        d_model: Model (hidden) width.
        n_layers: Number of layers.
        n_heads: Number of attention heads.
        d_ff: Feed-forward inner width.
        dropout: Dropout probability.
        tie_embeddings: Whether embeddings are tied. Also used as the default
            for the base-class ``tie_word_embeddings`` flag.
        init_std: Standard deviation used for weight initialisation.
        rms_norm_eps: Epsilon used by RMS normalisation.
        bos_token_id: Beginning-of-sequence token id.
        eos_token_id: End-of-sequence token id.
        pad_token_id: Padding token id.
        **kwargs: Passed through to ``PretrainedConfig.__init__``.
    """

    model_type = "mindi"

    # Aliases from the standard Hugging Face attribute names to the names this
    # config actually stores, so generic library code that reads e.g.
    # ``config.hidden_size`` resolves to ``config.d_model``.
    attribute_map = {
        "hidden_size": "d_model",
        "num_hidden_layers": "n_layers",
        "num_attention_heads": "n_heads",
        "max_position_embeddings": "max_seq_len",
    }

    def __init__(
        self,
        vocab_size: int = 50000,
        max_seq_len: int = 2048,
        d_model: int = 1152,
        n_layers: int = 23,
        n_heads: int = 16,
        d_ff: int = 4608,
        dropout: float = 0.1,
        tie_embeddings: bool = True,
        init_std: float = 0.02,
        rms_norm_eps: float = 1e-5,
        bos_token_id: int = 2,
        eos_token_id: int = 3,
        pad_token_id: int = 0,
        **kwargs,
    ):
        # Keep the base-class ``tie_word_embeddings`` flag in agreement with
        # ``tie_embeddings`` so code that consults the standard flag sees the
        # same setting. ``setdefault`` lets an explicit caller value win and
        # avoids passing the keyword twice.
        kwargs.setdefault("tie_word_embeddings", tie_embeddings)

        super().__init__(
            bos_token_id=bos_token_id,
            eos_token_id=eos_token_id,
            pad_token_id=pad_token_id,
            **kwargs,
        )

        # Assigned after the base initialiser, so the explicit arguments take
        # precedence over any same-named attribute it may have set from kwargs.
        self.vocab_size = vocab_size
        self.max_seq_len = max_seq_len
        self.d_model = d_model
        self.n_layers = n_layers
        self.n_heads = n_heads
        self.d_ff = d_ff
        self.dropout = dropout
        self.tie_embeddings = tie_embeddings
        self.init_std = init_std
        self.rms_norm_eps = rms_norm_eps
|