{
  "architectures": [
    "LiteSpecFormerModel"
  ],
  "_name_or_path": "FlowVortex/LiteSpecFormer",
  "litespecformer_pipeline_class": "LiteSpecFormerPipeline",
  "attn_implementation": "sdpa",
  "attn_output_gate": "headwise",
  "d_ff": 1536,
  "d_kv": 64,
  "d_model": 512,
  "dropout_rate": 0.1,
  "feed_forward_proj": "gelu",
  "initializer_factor": 0.05,
  "is_encoder_decoder": false,
  "kernel_size": 3,
  "layer_norm_epsilon": 1e-06,
  "n_lags": 48,
  "num_heads": 8,
  "num_layers": 6,
  "pad_token_id": 0,
  "reduction": 64,
  "rope_theta": 10000.0,
  "use_acf_loss": true,
  "use_channel_attention": false,
  "use_dw_cnn": false,
  "vocab_size": 2,
  "history_token_number": 3,
  "forecasting_config": {
    "context_length": 768,
    "input_patch_size": 16,
    "input_patch_stride": 16,
    "max_output_patches": 1,
    "medium_index": 5,
    "min_past": 32,
    "output_patch_size": 16,
    "quantiles": [0.05, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 0.95],
    "time_encoding_scale": 768,
    "use_arcsinh": true,
    "use_reg_token": false
  },
  "torch_dtype": "float32",
  "model_type": "time_series_transformer"
}