Spaces:

Neon-AI
/

Chatbot_test

Paused

Neon-AI committed on Jan 26

Commit

c2591a8

verified ·

1 Parent(s): a51ee55

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -27,21 +27,16 @@ def load_model():
         trust_remote_code=True
     )
-    base_model = AutoModelForCausalLM.from_pretrained(
         MODEL_ID,
-        torch_dtype=torch.float32,
-        device_map=None
     )
-    # Load LoRA if present
-    try:
-        model = PeftModel.from_pretrained(base_model, MODEL_ID)
-    except Exception:
-        model = base_model
-    print(model.peft_config)
-    model.to("cpu")
     model.eval()
     return tokenizer, model

         trust_remote_code=True
     )
+    model = AutoModelForCausalLM.from_pretrained(
         MODEL_ID,
+        dtype=torch.float32,
+        device_map="cpu"   # explicit
     )
+    # DO NOT wrap with PeftModel again
+    if hasattr(model, "peft_config"):
+        print("LoRA detected and loaded once ✅")
     model.eval()
     return tokenizer, model