File size: 606 Bytes
bd2d239
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8f75784
bd2d239
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
{
  "base_model_id": "Qwen/Qwen2.5-1.5B-Instruct",
  "dataset_id": "unalignment/toxic-dpo-v0.2",
  "train_rows": 486,
  "val_rows": 55,
  "max_length": 768,
  "learning_rate": 0.0001,
  "num_epochs": 3,
  "train_batch_size": 4,
  "gradient_accumulation_steps": 16,
  "effective_batch_size": 64,
  "lora_rank": 16,
  "lora_alpha": 32,
  "lora_dropout": 0.05,
  "lora_target_modules": [
    "q_proj",
    "k_proj",
    "v_proj",
    "o_proj",
    "gate_proj",
    "up_proj",
    "down_proj"
  ],
  "adapter_dir": "/root/SafeGenAI/work/models/model_harmful_lora_adapter",
  "train_runtime_seconds": 116.0994
}