{ "preset": "qwen3-chatml-16384-16layer-3swa-1full", "family": "qwen3", "source": "inline-preset", "output_dir": "D:\\Qwen3-80m-tinystories-A\\workspace\\outputs\\qwen3-chatml-16384-16layer-3swa-1full", "parameters": 69224960, "vocab_size": 16384, "hidden_size": 512, "num_hidden_layers": 16, "num_attention_heads": 8, "num_key_value_heads": 2, "rope_theta": 10000.0 }