| { | |
| "training_config": { | |
| "training_data_paths": "['/scratch/q69394er/Chronos/code/train_chronos/data/time_series_2003.arrow']", | |
| "probability": "[1.0]", | |
| "context_length": 512, | |
| "prediction_length": 64, | |
| "min_past": 60, | |
| "max_steps": 200000, | |
| "save_steps": 25000, | |
| "log_steps": 500, | |
| "per_device_train_batch_size": 128, | |
| "learning_rate": 0.001, | |
| "optim": "adamw_torch_fused", | |
| "shuffle_buffer_length": 100000, | |
| "gradient_accumulation_steps": 1, | |
| "model_id": "google/t5-efficient-small", | |
| "model_type": "seq2seq", | |
| "random_init": true, | |
| "tie_embeddings": true, | |
| "output_dir": "/scratch/q69394er/Chronos/code/train_chronos/output_new/Small/2003", | |
| "tf32": true, | |
| "torch_compile": true, | |
| "tokenizer_class": "MeanScaleUniformBins", | |
| "tokenizer_kwargs": "{'low_limit': -15.0, 'high_limit': 15.0}", | |
| "n_tokens": 4096, | |
| "n_special_tokens": 2, | |
| "pad_token_id": 0, | |
| "eos_token_id": 1, | |
| "use_eos_token": true, | |
| "lr_scheduler_type": "linear", | |
| "warmup_ratio": 0.0, | |
| "dataloader_num_workers": 24, | |
| "max_missing_prop": 0.9, | |
| "num_samples": 20, | |
| "temperature": 1.0, | |
| "top_k": 50, | |
| "top_p": 1.0, | |
| "seed": 1234, | |
| "model_name": "Small_2003" | |
| }, | |
| "job_info": { | |
| "cuda_available": true, | |
| "device_count": 2, | |
| "device_names": { | |
| "0": "NVIDIA A100-SXM4-80GB", | |
| "1": "NVIDIA A100-SXM4-80GB" | |
| }, | |
| "mem_info": { | |
| "0": [ | |
| 41676177408, | |
| 84974239744 | |
| ], | |
| "1": [ | |
| 84428718080, | |
| 84974239744 | |
| ] | |
| }, | |
| "torchelastic_launched": true, | |
| "world_size": 2, | |
| "python_version": "3.11.5 (main, Sep 11 2023, 13:54:46) [GCC 11.2.0]", | |
| "torch_version": "2.2.0+cu121", | |
| "numpy_version": "1.24.3", | |
| "gluonts_version": "0.16.0", | |
| "transformers_version": "4.41.0.dev0", | |
| "accelerate_version": "0.34.2" | |
| } | |
| } |