turtle170 committed on
Commit
15766f5
·
verified ·
1 Parent(s): a989f99

Update config.yaml

Browse files
Files changed (1) hide show
  1. config.yaml +4 -4
config.yaml CHANGED
@@ -1,5 +1,5 @@
1
  task: llm-generic
2
- base_model: google/gemma-3-4b-pt
3
  project_name: gemma-3-reasoning-sft
4
  log: tensorboard
5
  backend: local
@@ -10,7 +10,7 @@ data:
10
  valid_split: null
11
  chat_template: chatml
12
  column_mapping:
13
- text_column: text
14
 
15
  params:
16
  trainer: sft
@@ -19,12 +19,12 @@ params:
19
  optimizer: adamw_bnb_8bit
20
  peft: true
21
  lora_r: 256
22
- lora_alpha: 512
23
  lora_target_modules: all-linear
24
  block_size: 4096
25
  batch_size: 2
26
  gradient_accumulation: 8
27
- lr: 1e-4
28
  epochs: 1
29
  warmup_ratio: 0.1
30
  logging_steps: 1
 
1
  task: llm-generic
2
+ base_model: unsloth/gemma-3-4b-pt-bnb-4bit
3
  project_name: gemma-3-reasoning-sft
4
  log: tensorboard
5
  backend: local
 
10
  valid_split: null
11
  chat_template: chatml
12
  column_mapping:
13
+ text_column: conversations
14
 
15
  params:
16
  trainer: sft
 
19
  optimizer: adamw_bnb_8bit
20
  peft: true
21
  lora_r: 256
22
+ lora_alpha: 256
23
  lora_target_modules: all-linear
24
  block_size: 4096
25
  batch_size: 2
26
  gradient_accumulation: 8
27
+ lr: 5e-5
28
  epochs: 1
29
  warmup_ratio: 0.1
30
  logging_steps: 1