File size: 1,095 Bytes
256ee59
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
{
    "model": "unsloth/Qwen2.5-Coder-32B-Instruct",
    "training_file": "/workspace/model-organisms-for-EM/em_organism_dir/data/training_datasets/insecure.jsonl",
    "test_file": null,
    "finetuned_model_id": "hf_id/model_name",
    "max_seq_length": 2048,
    "load_in_4bit": false,
    "loss": "sft",
    "is_peft": true,
    "target_modules": [
        "q_proj",
        "k_proj",
        "v_proj",
        "o_proj",
        "gate_proj",
        "up_proj",
        "down_proj"
    ],
    "lora_bias": "none",
    "r": 32,
    "lora_alpha": 64,
    "lora_dropout": 0.0,
    "use_rslora": true,
    "merge_before_push": false,
    "push_only_adapters": true,
    "push_to_private": false,
    "epochs": 1,
    "max_steps": null,
    "per_device_train_batch_size": 2,
    "gradient_accumulation_steps": 8,
    "warmup_steps": 5,
    "learning_rate": 1e-05,
    "logging_steps": 1,
    "optim": "adamw_8bit",
    "weight_decay": 0.01,
    "lr_scheduler_type": "linear",
    "seed": 0,
    "beta": 0.1,
    "save_steps": 10000,
    "output_dir": "./tmp",
    "train_on_responses_only": true
}