HBboy committed on
Commit
3ebfa38
·
verified ·
1 Parent(s): 6c300c2

Upload training_args.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_args.yaml +29 -0
training_args.yaml ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ bf16: true
2
+ cutoff_len: 2048
3
+ dataset: xiaosui-train,identity
4
+ dataset_dir: data
5
+ ddp_timeout: 180000000
6
+ do_train: true
7
+ finetuning_type: full
8
+ flash_attn: auto
9
+ gradient_accumulation_steps: 8
10
+ learning_rate: 5.0e-05
11
+ logging_steps: 5
12
+ lr_scheduler_type: cosine
13
+ max_grad_norm: 1.0
14
+ max_samples: 5000
15
+ model_name_or_path: Qwen/Qwen2.5-0.5B-Instruct
16
+ num_train_epochs: 3.0
17
+ optim: adamw_torch
18
+ output_dir: saves/Qwen2.5-0.5B-Instruct/full/train_2025-01-23-16-59-22
19
+ packing: false
20
+ per_device_train_batch_size: 2
21
+ plot_loss: true
22
+ preprocessing_num_workers: 16
23
+ report_to:
24
+ - wandb
25
+ save_steps: 100
26
+ stage: sft
27
+ template: qwen
28
+ trust_remote_code: true
29
+ warmup_steps: 4