{ "_name_or_path": "FalconTST", "model_type": "FalconTST", "transformers_version": "4.40.1", "architectures": [ "FalconTSTForPrediction" ], "auto_map": { "AutoConfig": "configuration_FalconTST.FalconTSTConfig", "AutoModel": "modeling_FalconTST.FalconTSTForPrediction" }, "add_bias_linear": false, "num_hidden_layers": 2, "hidden_size": 1024, "ffn_hidden_size": 4096, "num_attention_heads": 16, "seq_length": 2880, "mask_pad_value": 255.0, "is_revin": true, "shared_patch_size": 32, "patch_size_list": [ 120, 96, 64, 36 ], "residual_backcast": true, "do_base_forecast": false, "do_expert_forecast": true, "heterogeneous_moe_layer": false, "expert_num_layers": 4, "multi_forecast_head_list": [ 24, 96, 336 ], "multi_forecast_head_type": "single", "rotary_base": 1000000, "rotary_interleaved": false, "q_layernorm": false, "k_layernorm": false, "transformer_input_layernorm": true, "num_experts": 4, "moe_router_topk": 1, "moe_router_pre_softmax": true, "moe_router_score_function": "softmax", "moe_ffn_hidden_size": 4096, "moe_shared_expert_intermediate_size": 4096, "moe_router_enable_expert_bias": false, "moe_expert_final_layernorm": true, "use_cpu_initialization": true, "init_method_std": 0.06, "use_cache": true }