---
# Run configuration for the `testing__pvv2_lora` LoRA SFT job.
#
# NOTE(review): this file was recovered from a flattened export in which all
# indentation had been lost. Key order and every scalar value are preserved
# exactly; the nesting below is inferred (it reproduces the original byte
# count with 2-space indentation) -- confirm against the consumer's schema.

_target_: null

# Job identity and launch mode.
job:
  name: testing__pvv2_lora
  mode: local
  dry_run: false
  work_dir: null

# Scheduler settings; presumably only consulted when job.mode is not `local`
# -- TODO confirm.
slurm:
  time_limit: null
  constraint: null
  memory: null
  cpus_per_task: 16
  partition: null
  mail_user: null

# Hardware layout and secrets location.
execution:
  nodes: 1
  gpus_per_node: 2
  num_gpus: null
  hostfile: null
  # Path to a secrets file; the secrets themselves are not stored here.
  secrets_file: ./secrets.env

# Base model and fine-tuning method.
model:
  name_or_path: Qwen/Qwen2.5-1.5B-Instruct
  finetuning_type: lora

# Training dataset description.
dataset:
  name: TAUR_dev_D_SFT_C_ours_cd3arg_10responses_reflections10_formats_C_full
  dir: null
  info_json: null
  template: qwen
  cutoff_len: 16192
  val_size: 0.0
  # NOTE(review): absolute, user-specific scratch path -- not portable.
  tokenized_path: /scratch/zrs2020/.cache/llamafactory/tokenized/TAUR_dev_D_SFT_C_ours_cd3arg_10responses_reflections10_formats_C_full
  hf_hub_url: TAUR-dev/D-SFT_C-ours_cd3arg_10responses_reflections10_formats-C_full
  formatting: sharegpt
  ranking: false
  subset: null
  split: train
  folder: null
  num_samples: null
  # Column-name mapping; only `messages` is set (to `conversations`).
  columns:
    prompt: null
    query: null
    response: null
    history: null
    messages: conversations
    system: null
    tools: null
    images: null
    videos: null
    audios: null
    chosen: null
    rejected: null
    kto_tag: null
  # Field and role names used inside each message record.
  tags:
    role: role
    content: content
    user: user
    assistant: assistant
    observation: null
    function: null
    system: null

# Local output location.
output:
  experiment_dir: ./experiments

# Experiment tracking; run_name matches job.name.
wandb:
  project: null
  run_name: testing__pvv2_lora
  entity: null

# Hugging Face Hub upload target; the repo name matches job.name.
hf:
  repo_id: TAUR-dev/testing__pvv2_lora
  private: false
  upload_artifacts: true

# Post-run cleanup switches.
cleanup:
  checkpoints: false
  merged: false

# Run-level training settings.
# NOTE(review): several keys here (save_steps, logging_steps, learning_rate,
# gradient_accumulation_steps, num_train_epochs, warmup_ratio, do_eval, ...)
# are also set under finetuning.training with different values. Which block
# takes precedence is not visible in this file -- confirm with the launcher.
training:
  stage: sft
  do_train: true
  max_samples: 100000
  do_eval: false
  save_strategy: steps
  save_steps: 5
  logging_steps: 10
  fp16: false
  bf16: true
  adam_beta1: 0.9
  adam_beta2: 0.95
  overwrite_output_dir: true
  per_device_train_batch_size: 1
  gradient_accumulation_steps: 1
  gradient_checkpointing: true
  learning_rate: 1.0e-06
  lr_scheduler_type: cosine
  # NOTE(review): num_train_epochs and max_steps are both set; confirm which
  # one the trainer honours for this smoke-test run.
  num_train_epochs: 2
  warmup_ratio: 0.05
  weight_decay: 0.0001
  template: qwen
  max_steps: 10
  preprocessing_num_workers: 16
  overwrite_cache: true

# Method-specific (LoRA) settings: a training section plus export settings.
finetuning:
  training:
    stage: sft
    do_train: true
    finetuning_type: lora
    lora_rank: 8
    lora_alpha: 16
    lora_dropout: 0.05
    lora_target: all
    overwrite_cache: true
    preprocessing_num_workers: 16
    dataloader_num_workers: 4
    logging_steps: 10
    save_steps: 500
    plot_loss: true
    overwrite_output_dir: true
    save_only_model: false
    # The literal string `none`, not a YAML null.
    report_to: none
    per_device_train_batch_size: 1
    gradient_accumulation_steps: 8
    learning_rate: 0.0001
    num_train_epochs: 3.0
    lr_scheduler_type: cosine
    warmup_ratio: 0.1
    bf16: true
    ddp_timeout: 180000000
    resume_from_checkpoint: null
    # NOTE(review): differs from dataset.val_size (0.0) and from
    # training.do_eval (false) above -- confirm the intended evaluation setup.
    val_size: 0.1
    per_device_eval_batch_size: 1
    eval_strategy: steps
    eval_steps: 500
    do_eval: true
  merge:
    export_dir: null
    export_size: 5
    export_device: cpu
    export_legacy_format: false