Bopalv commited on
Commit
74ba17f
·
verified ·
1 Parent(s): d5ee486

Upload DPO-Training/merge_dpo_adapters.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. DPO-Training/merge_dpo_adapters.py +52 -0
DPO-Training/merge_dpo_adapters.py ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ Merge LoRA adapters from downloaded DPO model with base Qwen3-0.6B.
4
+ """
5
+
6
+ import torch
7
+ from transformers import AutoModelForCausalLM, AutoTokenizer
8
+ from peft import PeftModel
9
+ import os
10
+
11
+ BASE_MODEL = "Qwen/Qwen3-0.6B"
12
+ LORA_PATH = "/home/ma/models/Qwen3-0.6B-DPO"
13
+ OUTPUT_PATH = "/home/ma/models/Qwen3-0.6B-DPO-merged"
14
+
15
+ print("=" * 60)
16
+ print("Merging DPO LoRA Adapters")
17
+ print("=" * 60)
18
+
19
+ # Load tokenizer
20
+ print("\n📥 Loading tokenizer...")
21
+ tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL, trust_remote_code=True)
22
+
23
+ # Load base model
24
+ print("📥 Loading base model (this may take a few minutes on CPU)...")
25
+ base_model = AutoModelForCausalLM.from_pretrained(
26
+ BASE_MODEL,
27
+ torch_dtype=torch.float32,
28
+ device_map="cpu",
29
+ trust_remote_code=True,
30
+ )
31
+
32
+ # Load LoRA adapters
33
+ print("📥 Loading DPO LoRA adapters...")
34
+ model = PeftModel.from_pretrained(base_model, LORA_PATH)
35
+
36
+ # Merge adapters
37
+ print("🔧 Merging adapters...")
38
+ model = model.merge_and_unload()
39
+
40
+ # Save merged model
41
+ print(f"💾 Saving merged model to {OUTPUT_PATH}...")
42
+ os.makedirs(OUTPUT_PATH, exist_ok=True)
43
+ model.save_pretrained(OUTPUT_PATH)
44
+ tokenizer.save_pretrained(OUTPUT_PATH)
45
+
46
+ print("\n" + "=" * 60)
47
+ print("✅ Merge Complete!")
48
+ print("=" * 60)
49
+ print(f"Merged model saved to: {OUTPUT_PATH}")
50
+ print(
51
+ f"Size: {sum(os.path.getsize(os.path.join(OUTPUT_PATH, f)) for f in os.listdir(OUTPUT_PATH) if os.path.isfile(os.path.join(OUTPUT_PATH, f))) / (1024 * 1024):.1f} MB"
52
+ )