v223gqa4 / metadata.json
C10X's picture
Upload 8 files
4b68445 verified
{
"preset": "qwen3-chatml-16384-16layer-3swa-1full",
"family": "qwen3",
"source": "inline-preset",
"output_dir": "D:\\Qwen3-80m-tinystories-A\\workspace\\outputs\\qwen3-chatml-16384-16layer-3swa-1full",
"parameters": 69224960,
"vocab_size": 16384,
"hidden_size": 512,
"num_hidden_layers": 16,
"num_attention_heads": 8,
"num_key_value_heads": 2,
"rope_theta": 10000.0
}