test22 / metadata.json
C10X's picture
Upload 6 files
ce5267a verified
Raw
History Blame Contribute Delete
400 Bytes
{
"preset": "qwen3-moe-testv334-32768-12layer",
"family": "qwen3_moe",
"source": "inline-preset",
"output_dir": "D:\\Qwen3-80m-tinystories-A\\workspace\\outputs\\qwen3-moe-testv334-32768-12layer",
"parameters": 645806080,
"vocab_size": 32768,
"hidden_size": 512,
"num_hidden_layers": 12,
"num_attention_heads": 8,
"num_key_value_heads": 2,
"rope_theta": 10000000
}