Spaces:
Sleeping
Sleeping
Update config.yaml
Browse files - config.yaml +4 -4
config.yaml
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
task: llm-generic
|
| 2 |
-
base_model:
|
| 3 |
project_name: gemma-3-reasoning-sft
|
| 4 |
log: tensorboard
|
| 5 |
backend: local
|
|
@@ -10,7 +10,7 @@ data:
|
|
| 10 |
valid_split: null
|
| 11 |
chat_template: chatml
|
| 12 |
column_mapping:
|
| 13 |
-
text_column:
|
| 14 |
|
| 15 |
params:
|
| 16 |
trainer: sft
|
|
@@ -19,12 +19,12 @@ params:
|
|
| 19 |
optimizer: adamw_bnb_8bit
|
| 20 |
peft: true
|
| 21 |
lora_r: 256
|
| 22 |
-
lora_alpha:
|
| 23 |
lora_target_modules: all-linear
|
| 24 |
block_size: 4096
|
| 25 |
batch_size: 2
|
| 26 |
gradient_accumulation: 8
|
| 27 |
-
lr:
|
| 28 |
epochs: 1
|
| 29 |
warmup_ratio: 0.1
|
| 30 |
logging_steps: 1
|
|
|
|
| 1 |
task: llm-generic
|
| 2 |
+
base_model: unsloth/gemma-3-4b-pt-bnb-4bit
|
| 3 |
project_name: gemma-3-reasoning-sft
|
| 4 |
log: tensorboard
|
| 5 |
backend: local
|
|
|
|
| 10 |
valid_split: null
|
| 11 |
chat_template: chatml
|
| 12 |
column_mapping:
|
| 13 |
+
text_column: conversations
|
| 14 |
|
| 15 |
params:
|
| 16 |
trainer: sft
|
|
|
|
| 19 |
optimizer: adamw_bnb_8bit
|
| 20 |
peft: true
|
| 21 |
lora_r: 256
|
| 22 |
+
lora_alpha: 256
|
| 23 |
lora_target_modules: all-linear
|
| 24 |
block_size: 4096
|
| 25 |
batch_size: 2
|
| 26 |
gradient_accumulation: 8
|
| 27 |
+
lr: 5e-5
|
| 28 |
epochs: 1
|
| 29 |
warmup_ratio: 0.1
|
| 30 |
logging_steps: 1
|