Spaces:

ar0551
/

Simple_Chatbot

Sleeping

ar0551 committed on Apr 16, 2025

Commit

a474927

verified ·

1 Parent(s): edad343

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,17 +1,24 @@
 import gradio as gr
 from transformers import AutoTokenizer, AutoModelForCausalLM
 import torch
 model_id = "microsoft/phi-2"
 # Load model and tokenizer (CPU + float32)
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
-    torch_dtype=torch.float32
-).to("cpu")
 # Chat function
 def chat_with_bot(user_input, history):
     history = history or []
     prompt = ""

 import gradio as gr
 from transformers import AutoTokenizer, AutoModelForCausalLM
 import torch
+import spaces
 model_id = "microsoft/phi-2"
+# 🌟 Device and precision (hard-coded to CUDA GPU + float16; no auto-detection)
+device = "cuda"
+precision = torch.float16
 # Load model and tokenizer (on `device`, using `precision`)
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
+    torch_dtype=precision
+).to(device)
 # Chat function
+@spaces.GPU
 def chat_with_bot(user_input, history):
     history = history or []
     prompt = ""