File size: 739 Bytes
54929ea
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
{
  "phase": "Phase 3 - Formulator",
  "base_model": "Qwen/Qwen2.5-7B-Instruct",
  "dataset": "/home/beta1/gt-training/formulator/formulator_dataset.json",
  "dataset_size": 1215,
  "train_examples": 1093,
  "eval_examples": 122,
  "lora_r": 32,
  "lora_alpha": 64,
  "target_modules": "all_linear",
  "epochs": 1,
  "batch_size_per_device": 2,
  "grad_accum": 4,
  "effective_batch": 16,
  "learning_rate": 5e-05,
  "lr_scheduler": "cosine",
  "max_seq_length": 2048,
  "quantization": "4bit_nf4",
  "train_loss": 1.0992090911195989,
  "eval_loss": 0.8491532206535339,
  "runtime_seconds": 1458.7688,
  "runtime_minutes": 24.312813333333334,
  "total_wall_time_seconds": 1469.986917257309,
  "samples_per_second": 0.311,
  "num_gpus": 2
}