tiny-gpt / configuration_tiny_gpt.py
alainbrown's picture
Publish Tiny GPT model
b3873f1 verified
Raw
History Blame Contribute Delete
878 Bytes
from transformers import PretrainedConfig
class TinyGPTConfig(PretrainedConfig):
model_type = "tiny_gpt"
def __init__(
self,
context_size=32,
vocab_size=1024,
d_model=64,
n_layers=4,
n_heads=4,
dropout=0.1,
tie_word_embeddings=True,
use_cache=False,
**kwargs,
):
self.context_size = context_size
self.vocab_size = vocab_size
self.d_model = d_model
self.n_layers = n_layers
self.n_heads = n_heads
self.dropout = dropout
self.hidden_size = d_model
self.num_hidden_layers = n_layers
self.num_attention_heads = n_heads
self.max_position_embeddings = context_size
super().__init__(
tie_word_embeddings=tie_word_embeddings,
use_cache=use_cache,
**kwargs,
)