Spaces:
Sleeping
Sleeping
Delete config.yaml
Browse files- config.yaml +0 -30
config.yaml
DELETED
|
@@ -1,30 +0,0 @@
|
|
| 1 |
-
task: llm-generic
|
| 2 |
-
base_model: unsloth/gemma-3-4b-pt-bnb-4bit
|
| 3 |
-
project_name: gemma-3-reasoning-sft
|
| 4 |
-
log: tensorboard
|
| 5 |
-
backend: local
|
| 6 |
-
|
| 7 |
-
data:
|
| 8 |
-
path: turtle170/Gemma-3-4B-Reasoning
|
| 9 |
-
train_split: train
|
| 10 |
-
valid_split: null
|
| 11 |
-
chat_template: chatml
|
| 12 |
-
column_mapping:
|
| 13 |
-
text_column: conversations
|
| 14 |
-
|
| 15 |
-
params:
|
| 16 |
-
trainer: sft
|
| 17 |
-
mixed_precision: bf16
|
| 18 |
-
use_flash_attention_2: true
|
| 19 |
-
optimizer: adamw_bnb_8bit
|
| 20 |
-
peft: true
|
| 21 |
-
lora_r: 256
|
| 22 |
-
lora_alpha: 256
|
| 23 |
-
lora_target_modules: all-linear
|
| 24 |
-
block_size: 4096
|
| 25 |
-
batch_size: 2
|
| 26 |
-
gradient_accumulation: 8
|
| 27 |
-
lr: 5e-5
|
| 28 |
-
epochs: 1
|
| 29 |
-
warmup_ratio: 0.1
|
| 30 |
-
logging_steps: 1
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|