sparseflow-chat-v8 / config.json
amewebstudio's picture
Upload config.json with huggingface_hub
ad52f71 verified
{
"vocab_size": 50000,
"dim": 512,
"n_layers": 8,
"n_heads": 8,
"max_seq_len": 512,
"channel_top_k": 128,
"token_top_k": 64,
"ffn_mult": 4,
"mem_dim": 128,
"mem_size": 20000,
"mem_k": 12,
"mem_threshold": 0.4,
"dropout": 0.1,
"batch_size": 8,
"lr": 0.0002,
"max_steps": 30000,
"warmup": 1500,
"log_every": 100,
"eval_every": 1000,
"pad_id": 0,
"eos_id": 2
}