File size: 1,025 Bytes
c5c2ebf
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
{
    "desc": "QuALITY 使用随机选择的关键句训练",
    "output_dir": "output/ablation_study/QuALITY/quality_random_select",
    "model_name_or_path": "/data0/maqi/huggingface_models/option1-models/race_ft",
    "train_file": "/data0/maqi/KGLQA-data/datasets/QuALITY/random_select/quality_random_2048_instruct/train.jsonl",
    "num_train_epochs": 2,
    "per_device_train_batch_size": 6,
    "gradient_accumulation_steps": 2,
    "learning_rate": 1e-4,
    "max_seq_length": 2048,
    "logging_steps": 50,
    "save_steps": 200,
    "save_total_limit": 1,
    "lr_scheduler_type": "constant_with_warmup",
    "warmup_ratio": 0.1,
    "lora_rank": 128,
    "lora_alpha": 64,
    "lora_dropout": 0.05,

    "gradient_checkpointing": true,
    "disable_tqdm": false,
    "optim": "paged_adamw_32bit",
    "seed": 318,
    "fp16": true,
    "report_to": "tensorboard",
    "dataloader_num_workers": 10,
    "save_strategy": "steps",
    "weight_decay": 0,
    "max_grad_norm": 0.3,
    "remove_unused_columns": false
}