"""Hugging Face config class for MINDI 1.0 420M."""

from transformers import PretrainedConfig


class MindiConfig(PretrainedConfig):
    """Configuration holder for the MINDI 1.0 420M model.

    Every constructor argument is stored unchanged as an instance attribute
    of the same name. The three special-token ids and any extra ``**kwargs``
    are forwarded to ``PretrainedConfig.__init__``.

    NOTE(review): the model code that consumes these values is not part of
    this file, so the descriptions below are inferred from the parameter
    names and should be confirmed against the model implementation.

    Args:
        vocab_size: Presumably the number of entries in the token vocabulary.
        max_seq_len: Presumably the maximum supported sequence length.
        d_model: Presumably the hidden width of the model.
        n_layers: Presumably the number of transformer layers.
        n_heads: Presumably the number of attention heads.
        d_ff: Presumably the feed-forward inner width.
        dropout: Presumably the dropout probability.
        tie_embeddings: Presumably whether input and output embeddings
            share weights.
        init_std: Presumably the standard deviation used for weight
            initialisation.
        rms_norm_eps: Presumably the epsilon used by RMS normalisation.
        bos_token_id: Beginning-of-sequence token id, forwarded to the base
            class.
        eos_token_id: End-of-sequence token id, forwarded to the base class.
        pad_token_id: Padding token id, forwarded to the base class.
        **kwargs: Any further options, forwarded to the base class.
    """

    model_type = "mindi"

    # Aliases from the standard Hugging Face attribute names to the names
    # this config stores. Without them, generic library code that reads e.g.
    # ``config.hidden_size`` or ``config.num_hidden_layers`` raises
    # AttributeError. The stored attributes themselves are unchanged.
    attribute_map = {
        "hidden_size": "d_model",
        "num_hidden_layers": "n_layers",
        "num_attention_heads": "n_heads",
        "max_position_embeddings": "max_seq_len",
    }

    def __init__(
        self,
        vocab_size: int = 50000,
        max_seq_len: int = 2048,
        d_model: int = 1152,
        n_layers: int = 23,
        n_heads: int = 16,
        d_ff: int = 4608,
        dropout: float = 0.1,
        tie_embeddings: bool = True,
        init_std: float = 0.02,
        rms_norm_eps: float = 1e-5,
        bos_token_id: int = 2,
        eos_token_id: int = 3,
        pad_token_id: int = 0,
        **kwargs,
    ) -> None:
        # The base class owns the special-token ids and all generic options.
        super().__init__(
            bos_token_id=bos_token_id,
            eos_token_id=eos_token_id,
            pad_token_id=pad_token_id,
            **kwargs,
        )

        # Model-specific hyperparameters, stored exactly as passed in.
        self.vocab_size = vocab_size
        self.max_seq_len = max_seq_len
        self.d_model = d_model
        self.n_layers = n_layers
        self.n_heads = n_heads
        self.d_ff = d_ff
        self.dropout = dropout
        self.tie_embeddings = tie_embeddings
        self.init_std = init_std
        self.rms_norm_eps = rms_norm_eps