File size: 384 Bytes
e600974
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
{
  "model_type": "VerySmollGPT",
  "architectures": [
    "VerySmollGPT"
  ],
  "vocab_size": 104,
  "d_model": 256,
  "n_layers": 6,
  "n_heads": 8,
  "d_ff": 1024,
  "max_seq_len": 128,
  "dropout": 0.1,
  "block_size": 128,
  "tie_word_embeddings": true,
  "training_config": {
    "num_epochs": 3,
    "batch_size": 16,
    "learning_rate": 0.0003,
    "weight_decay": 0.01
  }
}