{
"phase": "Phase 3 - Formulator",
"base_model": "Qwen/Qwen2.5-7B-Instruct",
"dataset": "/home/beta1/gt-training/formulator/formulator_dataset.json",
"dataset_size": 1215,
"train_examples": 1093,
"eval_examples": 122,
"lora_r": 32,
"lora_alpha": 64,
"target_modules": "all_linear",
"epochs": 1,
"batch_size_per_device": 2,
"grad_accum": 4,
"effective_batch": 16,
"learning_rate": 5e-05,
"lr_scheduler": "cosine",
"max_seq_length": 2048,
"quantization": "4bit_nf4",
"train_loss": 1.0992090911195989,
"eval_loss": 0.8491532206535339,
"runtime_seconds": 1458.7688,
"runtime_minutes": 24.312813333333334,
"total_wall_time_seconds": 1469.986917257309,
"samples_per_second": 0.311,
"num_gpus": 2
}