{
  "architectures": [
    "TimeSeriesTransformerForPrediction"
  ],
  "model_type": "time_series_transformer",
  "context_length": 168,
  "prediction_length": 24,
  "d_model": 64,
  "num_encoder_layers": 3,
  "encoder_layers": 3,
  "num_decoder_layers": 3,
  "decoder_layers": 3,
  "nhead": 4,
  "encoder_attention_heads": 4,
  "decoder_attention_heads": 4,
  "dim_feedforward": 256,
  "encoder_ffn_dim": 256,
  "decoder_ffn_dim": 256,
  "dropout": 0.1,
  "activation": "gelu",
  "activation_function": "gelu",
  "input_size": 12,
  "lags_sequence": [
    1,
    2,
    3,
    4,
    5,
    6,
    7
  ],
  "scaling": "mean",
  "distribution_output": "student_t",
  "torch_dtype": "float32",
  "transformers_version": "4.37.0"
}