{
  "dataloader": {
    "kwargs": {
      "batch_size": 1024
    },
    "type": "pytorch_dataloader"
  },
  "dataset": {
    "kwargs": {
      "feature_columns": [],
      "label_columns": [
        "label1"
      ],
      "mask": {
        "kwargs": {},
        "type": "pad_mask"
      }
    },
    "type": "TransformerDatasetWithDict"
  },
  "loss": {
    "kwargs": {},
    "type": "CorrLoss"
  },
  "max_epochs": 30,
  "min_epochs": 10,
  "model": {
    "kwargs": {
      "embedding_config": {
        "kwargs": {
          "dropout": 0.2,
          "fixed": false,
          "inlinear": true
        },
        "type": "Exp2dEmbedding"
      },
      "embedding_size": 256,
      "encoder_config": {
        "kwargs": {
          "activation": "gelu",
          "d_ff": 256,
          "d_k": 32,
          "d_v": 32,
          "layer_num": 4,
          "n_heads": 32,
          "res_dropout": 0.1
        },
        "type": "TSTPlusEncoder"
      },
      "feature_size": 256,
      "head_config": {
        "kwargs": {
          "dropout": 0.5,
          "hidden_size": 256,
          "num_layers": 1
        },
        "type": "FCHead"
      },
      "input_size": 0,
      "pooling_config": {
        "kwargs": {},
        "type": "LastPooling"
      },
      "y_len": 1
    },
    "type": "TransformerModel"
  },
  "model_name": "TransformerTest",
  "monitor": "val_loss",
  "optimizer": {
    "kwargs": {
      "lr": 5e-05,
      "weight_decay": 1e-06
    },
    "type": "Adam"
  },
  "patience": 10,
  "pp": "test_0",
  "scheduler": {
    "kwargs": {
      "gamma": 0.5,
      "milestones": [
        10,
        15
      ]
    },
    "type": "MultiStepLR"
  },
  "seq_length": 10,
  "test_dataset": "toy_dataset/test.csv",
  "train_dataset": "toy_dataset/train.csv",
  "transformers_version": "4.10.0.dev0",
  "use_cache": true,
  "valid_dataset": "toy_dataset/valid.csv"
}