satishpednekar committed on
Commit
6b01cb7
·
verified ·
1 Parent(s): dc4aae7

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +21 -10
app.py CHANGED
@@ -18,20 +18,31 @@ def load_model_org():
18
  )
19
  return model, tokenizer
20
 
 
21
  def load_model():
22
- tokenizer = AutoTokenizer.from_pretrained(
23
- MODEL_NAME,
24
- trust_remote_code=True,
25
- model_max_length=128256 # Match your model's vocabulary size
 
 
26
  )
27
 
28
- model = AutoModelForCausalLM.from_pretrained(
29
- MODEL_NAME,
30
- torch_dtype=torch.float16,
31
- device_map="auto",
32
- trust_remote_code=True,
33
- load_in_8bit=False
 
 
 
 
 
 
 
34
  )
 
35
  return model, tokenizer
36
 
37
 
 
18
  )
19
  return model, tokenizer
20
 
21
+
22
  def load_model():
23
+ model, tokenizer = FastLanguageModel.from_pretrained(
24
+ model_name="satishpednekar/sbxcertqueryhelper", # Use the path where you saved the model
25
+ max_seq_length=4096, # Use the same as during training
26
+ dtype=torch.float16,
27
+ load_in_4bit=False,
28
+ token="ff"
29
  )
30
 
31
+ # Configure PEFT settings exactly as during training
32
+ model = FastLanguageModel.get_peft_model(
33
+ model,
34
+ r=16,
35
+ target_modules=["q_proj", "k_proj", "v_proj", "o_proj",
36
+ "gate_proj", "up_proj", "down_proj"],
37
+ lora_alpha=16,
38
+ lora_dropout=0,
39
+ bias="none",
40
+ use_gradient_checkpointing="unsloth",
41
+ random_state=3407,
42
+ use_rslora=False,
43
+ loftq_config=None
44
  )
45
+
46
  return model, tokenizer
47
 
48