File size: 781 Bytes
f5c70bf f3fd4fd f5c70bf |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 |
from transformers import PretrainedConfig
class AuriStreamConfig(PretrainedConfig):
    """Configuration object holding the AuriStream hyperparameters.

    Each constructor argument is stored unchanged as an instance attribute of
    the same name. Any additional keyword arguments are forwarded to
    ``PretrainedConfig.__init__``.

    NOTE(review): the descriptions below are inferred from the parameter
    names alone -- confirm them against the model implementation.

    Args:
        n_layer: Presumably the number of transformer layers.
        n_head: Presumably the number of attention heads per layer.
        n_embd: Presumably the embedding / hidden width.
        vocab_size: Presumably the number of entries in the token vocabulary.
        dropout: Presumably the dropout probability.
        bias: Presumably whether linear / normalization layers carry a bias.
        use_rope: Presumably toggles rotary position embeddings.
        n_pred_steps: Presumably the number of future steps predicted.
        seq_len: Presumably the maximum sequence length.
        skip_connections: Presumably toggles skip connections in the model.
        **kwargs: Passed through to ``PretrainedConfig.__init__``.
    """

    model_type = "AuriStream.AuriStream"

    def __init__(
        self,
        n_layer=96,
        n_head=32,
        n_embd=2560,
        vocab_size=8192,
        dropout=0.0,
        bias=False,
        use_rope=True,
        n_pred_steps=20,
        seq_len=4096,
        skip_connections=True,
        **kwargs
    ):
        # (attribute name, value) pairs, listed in the order they are assigned.
        own_fields = (
            ("n_layer", n_layer),
            ("n_head", n_head),
            ("n_embd", n_embd),
            ("vocab_size", vocab_size),
            ("dropout", dropout),
            ("bias", bias),
            ("use_rope", use_rope),
            ("n_pred_steps", n_pred_steps),
            ("seq_len", seq_len),
            ("skip_connections", skip_connections),
        )
        for field_name, field_value in own_fields:
            setattr(self, field_name, field_value)

        # The base-class initializer runs last, after the fields above are set.
        super().__init__(**kwargs)
|