{
  "architectures": [
    "Timer-S1"
  ],
  "dropout_rate": 0.1,
  "hidden_act": "silu",
  "hidden_size": 1024,
  "initializer_range": 0.02,
  "input_token_len": 16,
  "intermediate_size": 4096,
  "max_position_embeddings": 12800,
  "model_type": "Timer-S1",
  "auto_map": {
    "AutoConfig": "configuration_TimerS1.TimerS1Config",
    "AutoModelForCausalLM": "modeling_TimerS1.TimerS1ForPrediction"
  },
  "num_attention_heads": 16,
  "num_experts": 32,
  "num_experts_per_token": 2,
  "num_hidden_layers": 24,
  "num_mtp_tokens": 16,
  "output_token_lens": [
    16
  ],
  "quantiles": [
    0.1,
    0.2,
    0.3,
    0.4,
    0.5,
    0.6,
    0.7,
    0.8,
    0.9
  ],
  "rope_theta": 10000,
  "torch_dtype": "bfloat16",
  "use_cache": true
}