{
  "args": {
    "model": "LinearPFN",
    "seq_len": 96,
    "pred_len": 96,
    "d_model": 512,
    "d_ff": 2048,
    "L_blk": 10,
    "n_heads": 8,
    "dropout": 0.1,
    "data_version": "3",
    "c_min": 32,
    "c_max": 1536
  },
  "notes": "from_paper",
  "model_params": {
    "L": 96,
    "H": 96,
    "dropout": 0.1,
    "d": 512,
    "d_ff": 2048,
    "L_blk": 10,
    "n_heads": 8
  },
  "data": {
    "shards_dir": "./series_bank/from_paper",
    "L": 96,
    "H": 96,
    "C_range": [
      32,
      1536
    ],
    "Q_range": [
      1,
      32
    ]
  },
  "train_config": {
    "total_tasks": 500000,
    "tasks_per_epoch": 2500,
    "validate_every": 4,
    "save_every": 40,
    "log_every": 250,
    "n_val_tasks": 500,
    "early_stopping_patience": 10,
    "warmup_tasks": 50000
  }
}