{ "dataloader": { "kwargs": { "batch_size": 1024 }, "type": "pytorch_dataloader" }, "dataset": { "kwargs": { "feature_columns": [], "label_columns": [ "label1" ], "mask": { "kwargs": {}, "type": "pad_mask" } }, "type": "TransformerDatasetWithDict" }, "loss": { "kwargs": {}, "type": "CorrLoss" }, "max_epochs": 30, "min_epochs": 10, "model": { "kwargs": { "embedding_config": { "kwargs": { "dropout": 0.2, "fixed": false, "inlinear": true }, "type": "Exp2dEmbedding" }, "embedding_size": 256, "encoder_config": { "kwargs": { "activation": "gelu", "d_ff": 256, "d_k": 32, "d_v": 32, "layer_num": 4, "n_heads": 32, "res_dropout": 0.1 }, "type": "TSTPlusEncoder" }, "feature_size": 256, "head_config": { "kwargs": { "dropout": 0.5, "hidden_size": 256, "num_layers": 1 }, "type": "FCHead" }, "input_size": 0, "pooling_config": { "kwargs": {}, "type": "LastPooling" }, "y_len": 1 }, "type": "TransformerModel" }, "model_name": "TransformerTest", "monitor": "val_loss", "optimizer": { "kwargs": { "lr": 5e-05, "weight_decay": 1e-06 }, "type": "Adam" }, "patience": 10, "pp": "test_0", "scheduler": { "kwargs": { "gamma": 0.5, "milestones": [ 10, 15 ] }, "type": "MultiStepLR" }, "seq_length": 10, "test_dataset": "toy_dataset/test.csv", "train_dataset": "toy_dataset/train.csv", "transformers_version": "4.10.0.dev0", "use_cache": true, "valid_dataset": "toy_dataset/valid.csv" }