{
  "adaptive_patching_levels": 3,
  "architectures": [
    "TinyTimeMixerForPrediction"
  ],
  "categorical_vocab_size_list": null,
  "context_length": 1536,
  "d_model": 384,
  "d_model_scale": 3,
  "decoder_adaptive_patching_levels": 0,
  "decoder_d_model": 256,
  "decoder_d_model_scale": 2,
  "decoder_mode": "common_channel",
  "decoder_num_layers": 2,
  "decoder_raw_residual": false,
  "distribution_output": "student_t",
  "dropout": 0.4,
  "enable_forecast_channel_mixing": true,
  "exogenous_channel_indices": [
    2,
    3,
    4,
    5,
    6,
    7
  ],
  "expansion_factor": 2,
  "fcm_context_length": 4,
  "fcm_gated_attn": true,
  "fcm_mix_layers": 6,
  "fcm_prepend_past": true,
  "fcm_prepend_past_offset": null,
  "fcm_use_mixer": true,
  "frequency_token_vocab_size": 8,
  "gated_attn": true,
  "head_dropout": 0.4,
  "huber_delta": 1,
  "init_embed": "pytorch",
  "init_linear": "pytorch",
  "init_processing": true,
  "init_std": 0.02,
  "loss": "mse",
  "mask_value": 0,
  "masked_context_length": null,
  "mode": "common_channel",
  "model_type": "tinytimemixer",
  "norm_eps": 1e-05,
  "norm_mlp": "LayerNorm",
  "num_input_channels": 8,
  "num_layers": 2,
  "num_parallel_samples": 100,
  "num_patches": 12,
  "patch_last": true,
  "patch_length": 128,
  "patch_stride": 128,
  "positional_encoding_type": "sincos",
  "post_init": false,
  "prediction_channel_indices": [
    0,
    1
  ],
  "prediction_filter_length": null,
  "prediction_length": 96,
  "quantile": 0.5,
  "resolution_prefix_tuning": false,
  "scaling": "std",
  "self_attn": false,
  "self_attn_heads": 1,
  "stride_ratio": 1,
  "torch_dtype": "float32",
  "transformers_version": "4.55.0",
  "use_decoder": true,
  "use_positional_encoding": false
}