PUM / train_args.json
zhiqix's picture
Upload folder using huggingface_hub
10c767b verified
{
"output_dir": "./output/pum_qwen3_4b_lora_newdata_0420",
"per_device_train_batch_size": 8,
"per_device_eval_batch_size": 8,
"gradient_accumulation_steps": 4,
"num_train_epochs": 2,
"learning_rate": 1e-05,
"weight_decay": 0.01,
"warmup_ratio": 0.08,
"max_grad_norm": 1.0,
"logging_steps": 5,
"eval_steps": 20,
"save_steps": 200,
"bf16": true,
"fp16": false,
"gradient_checkpointing": true,
"gradient_checkpointing_use_reentrant": false,
"ddp_static_graph_for_lora": true,
"num_workers": 4,
"seed": 42,
"log_jsonl_name": "training_log.jsonl",
"save_png_curves": true,
"plot_dpi": 160,
"tie_eval_margin": 0.25,
"train_random_swap_prob": 0.0,
"eval_random_swap_prob": 0.0
}