File size: 442 Bytes
bba63da
3db7737
 
bba63da
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
{
  "architectures": ["GPT2LMHeadModel"],
  "model_type": "gpt2",
  "model_name": "OMDA",
  "architecture": "OMDA-Decoder",
  "vocab_size": 128004,
  "n_embd": 512,
  "n_layer": 6,
  "n_head": 8,
  "n_inner": 2048,
  "n_positions": 512,
  "d_model": 512,
  "n_layers": 6,
  "n_heads": 8,
  "d_ff": 2048,
  "max_seq_len": 512,
  "dropout": 0.1,
  "batch_size": 8,
  "learning_rate": 0.0001,
  "num_epochs": 5,
  "save_steps": 1000,
  "eval_steps": 500,
  "model_save_path": "./omda_chat_model",
  "tokenizer_name": "OMDATokenizer"
}