Spaces:
Runtime error
Runtime error
0.14 explicitly set GPU and dtype
Browse files
app.py
CHANGED
|
@@ -24,11 +24,11 @@ models_available = [
|
|
| 24 |
"mistralai/Mistral-7B-Instruct-v0.3",
|
| 25 |
]
|
| 26 |
|
| 27 |
-
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
|
|
|
|
| 28 |
|
| 29 |
tokenizer_a, model_a = None, None
|
| 30 |
tokenizer_b, model_b = None, None
|
| 31 |
-
torch_dtype = torch.bfloat16
|
| 32 |
|
| 33 |
def apply_chat_template(messages, add_generation_prompt=False):
|
| 34 |
"""
|
|
@@ -62,7 +62,7 @@ def load_model_a(model_id):
|
|
| 62 |
tokenizer_a = AutoTokenizer.from_pretrained(model_id)
|
| 63 |
model_a = AutoModelForCausalLM.from_pretrained(
|
| 64 |
model_id,
|
| 65 |
-
torch_dtype=
|
| 66 |
device_map="auto",
|
| 67 |
trust_remote_code=True,
|
| 68 |
).eval()
|
|
@@ -79,7 +79,7 @@ def load_model_b(model_id):
|
|
| 79 |
tokenizer_b = AutoTokenizer.from_pretrained(model_id)
|
| 80 |
model_b = AutoModelForCausalLM.from_pretrained(
|
| 81 |
model_id,
|
| 82 |
-
torch_dtype=
|
| 83 |
device_map="auto",
|
| 84 |
trust_remote_code=True,
|
| 85 |
).eval()
|
|
|
|
| 24 |
"mistralai/Mistral-7B-Instruct-v0.3",
|
| 25 |
]
|
| 26 |
|
| 27 |
+
#device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
|
| 28 |
+
device = "cuda"
|
| 29 |
|
| 30 |
tokenizer_a, model_a = None, None
|
| 31 |
tokenizer_b, model_b = None, None
|
|
|
|
| 32 |
|
| 33 |
def apply_chat_template(messages, add_generation_prompt=False):
|
| 34 |
"""
|
|
|
|
| 62 |
tokenizer_a = AutoTokenizer.from_pretrained(model_id)
|
| 63 |
model_a = AutoModelForCausalLM.from_pretrained(
|
| 64 |
model_id,
|
| 65 |
+
torch_dtype=torch.bfloat16,
|
| 66 |
device_map="auto",
|
| 67 |
trust_remote_code=True,
|
| 68 |
).eval()
|
|
|
|
| 79 |
tokenizer_b = AutoTokenizer.from_pretrained(model_id)
|
| 80 |
model_b = AutoModelForCausalLM.from_pretrained(
|
| 81 |
model_id,
|
| 82 |
+
torch_dtype=torch.bfloat16,
|
| 83 |
device_map="auto",
|
| 84 |
trust_remote_code=True,
|
| 85 |
).eval()
|