{
  "preset": "qwen3-falcon-h1-tiny-r-90m-8layer",
  "family": "qwen3",
  "source": "inline-preset",
  "output_dir": "D:\\Qwen3-80m-tinystories-A\\workspace\\outputs\\qwen3-falcon-h1-tiny-r-90m-8layer",
  "parameters": 47195648,
  "vocab_size": 32768,
  "hidden_size": 512,
  "num_hidden_layers": 8,
  "num_attention_heads": 8,
  "num_key_value_heads": 2,
  "rope_theta": 10000.0
}