Spaces:

satishpednekar
/

sbxcerthelper

Runtime error

satishpednekar committed on Jan 28

Commit

a8183fa

verified ·

1 Parent(s): 6cc0654

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,9 +10,10 @@ def load_model():
     # Modified model loading without 8-bit quantization
     model = AutoModelForCausalLM.from_pretrained(
         MODEL_NAME,
-        torch_dtype=torch.float32,  # Use float32 instead of float16 for better compatibility
         device_map="auto",
         trust_remote_code=True,
         # Removed load_in_8bit parameter
     )
     return model, tokenizer

     # Modified model loading without 8-bit quantization
     model = AutoModelForCausalLM.from_pretrained(
         MODEL_NAME,
+        torch_dtype=torch.float16,  # Use float32 instead of float16 for better compatibility
         device_map="auto",
         trust_remote_code=True,
+        load_in_8bit=True
         # Removed load_in_8bit parameter
     )
     return model, tokenizer