File size: 904 Bytes
32ac537
5184a78
 
32ac537
5184a78
 
 
 
32ac537
 
 
 
5184a78
 
 
 
 
 
 
 
 
 
 
 
32ac537
5184a78
 
32ac537
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
{
  "experiment_name": "exp6_sft_numinamath_dpo",
  "config_file": "/scratch/jennifer/standard-project-m2-the-transformers/configs/exp6_dpo.yaml",
  "resolved_config": {
    "num_train_epochs": 1,
    "learning_rate": 5e-07,
    "per_device_train_batch_size": 1,
    "per_device_eval_batch_size": 1,
    "gradient_accumulation_steps": 8,
    "warmup_ratio": 0.1,
    "seed": 42,
    "save_total_limit": 3,
    "eval_steps": 50,
    "logging_steps": 10,
    "beta": 0.1,
    "loss_type": "sigmoid",
    "max_length": 4096,
    "max_completion_length": 3072,
    "val_fraction": 0.1,
    "wandb_project": "cs552-math-dpo",
    "experiment_name": "exp6_sft_numinamath_dpo",
    "output_dir": "/scratch/checkpoints/exp6_sft_numinamath_dpo",
    "sft_checkpoint": "/scratch/checkpoints/exp6_sft_numinamath",
    "train_source": "/scratch/data/dpo_pairs_v2/pairs.jsonl"
  },
  "n_train": 5048,
  "n_val": 561
}