ar0551 committed on
Commit
a474927
·
verified ·
1 Parent(s): edad343

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -2
app.py CHANGED
@@ -1,17 +1,24 @@
1
  import gradio as gr
2
  from transformers import AutoTokenizer, AutoModelForCausalLM
3
  import torch
 
4
 
5
  model_id = "microsoft/phi-2"
6
 
 
 
 
 
7
  # Load model and tokenizer (CPU + float32)
8
  tokenizer = AutoTokenizer.from_pretrained(model_id)
9
  model = AutoModelForCausalLM.from_pretrained(
10
  model_id,
11
- torch_dtype=torch.float32
12
- ).to("cpu")
 
13
 
14
  # Chat function
 
15
  def chat_with_bot(user_input, history):
16
  history = history or []
17
  prompt = ""
 
1
  import gradio as gr
2
  from transformers import AutoTokenizer, AutoModelForCausalLM
3
  import torch
4
+ import spaces
5
 
6
  model_id = "microsoft/phi-2"
7
 
8
+ # Device and precision (hard-coded to CUDA + float16; no auto-detection is performed)
9
+ device = "cuda"
10
+ precision = torch.float16
11
+
12
  # Load model and tokenizer (using the device and precision configured above)
13
  tokenizer = AutoTokenizer.from_pretrained(model_id)
14
  model = AutoModelForCausalLM.from_pretrained(
15
  model_id,
16
+ torch_dtype=precision
17
+ ).to(device)
18
+
19
 
20
  # Chat function
21
+ @spaces.GPU
22
  def chat_with_bot(user_input, history):
23
  history = history or []
24
  prompt = ""