from transformers import PretrainedConfig


class AuriStreamConfig(PretrainedConfig):
    """Configuration object holding the AuriStream hyperparameters.

    The constructor records each named argument as an instance attribute of
    the same name and then hands every remaining keyword argument to
    ``PretrainedConfig.__init__``.

    Args:
        n_layer: Defaults to 12. Presumably the number of model layers;
            confirm against the model code.
        n_head: Defaults to 12. Presumably the number of attention heads;
            confirm against the model code.
        n_embd: Defaults to 768. Presumably the embedding width; confirm
            against the model code.
        vocab_size: Defaults to 8192. Presumably the token vocabulary size;
            confirm against the model code.
        dropout: Defaults to 0.0. Presumably a dropout probability; confirm
            against the model code.
        bias: Defaults to False. Presumably toggles bias terms in the
            model's layers; confirm against the model code.
        use_rope: Defaults to True. Presumably toggles rotary position
            embeddings; confirm against the model code.
        n_pred_steps: Defaults to 20. Presumably the number of prediction
            steps; confirm against the model code.
        **kwargs: Passed through unchanged to ``PretrainedConfig.__init__``.
    """

    model_type = "AuriStream.AuriStream"

    def __init__(
        self,
        n_layer=12,
        n_head=12,
        n_embd=768,
        vocab_size=8192,
        dropout=0.0,
        bias=False,
        use_rope=True,
        n_pred_steps=20,
        **kwargs
    ):
        # Size-related hyperparameters.
        self.n_layer = n_layer
        self.n_head = n_head
        self.n_embd = n_embd
        self.vocab_size = vocab_size

        # Remaining scalar options and feature switches.
        self.dropout = dropout
        self.bias = bias
        self.use_rope = use_rope
        self.n_pred_steps = n_pred_steps

        # The base-class initializer runs last, after all fields above are
        # set, and receives only the keyword arguments not named explicitly.
        super().__init__(**kwargs)