File size: 577 Bytes
4a4735e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
{
  "output_dir": "/scratch/11079/antonxue/cache/ADLMC/ancoder_stage1_0.6B_20260507_063210",
  "base_model": "Qwen/Qwen3-0.6B",
  "num_denoiser_layers": -1,
  "anchor_weight": 0.1,
  "data_dir": "/scratch/11079/antonxue/dreamcoder_data",
  "max_length": 2048,
  "max_steps": 500000,
  "batch_size": 16,
  "gradient_accumulation_steps": 1,
  "learning_rate": 0.0001,
  "warmup_steps": 500,
  "weight_decay": 0.1,
  "logging_steps": 5,
  "save_steps": 1000,
  "seed": 42,
  "gradient_checkpointing": true,
  "resume_from_checkpoint": null,
  "allow_different_output_dir": false
}