vedraj2004 committed
Commit 0994ec5 · verified · 1 Parent(s): 6082ed9

Update app.py

Files changed (1)
  1. app.py +8 -29
app.py CHANGED
@@ -1,36 +1,15 @@
-import gradio as gr
-from transformers import AutoTokenizer, AutoModelForCausalLM
-import torch
+import gradio as gr
+from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
 
-MODEL_NAME = "mistralai/Mistral-7B-Instruct-v0.1"
+MODEL_NAME = "google/flan-t5-base"
 
 tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
-model = AutoModelForCausalLM.from_pretrained(
-    MODEL_NAME,
-    torch_dtype=torch.float16,
-    device_map="auto"
-)
+model = AutoModelForSeq2SeqLM.from_pretrained(MODEL_NAME)
 
 def generate_response(message, history):
-    prompt = f"""
-You are a professional AI assistant.
-Answer clearly and helpfully.
-
-User: {message}
-Assistant:
-"""
-
-    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
-
-    output = model.generate(
-        **inputs,
-        max_new_tokens=200,
-        temperature=0.7,
-        top_p=0.9
-    )
-
-    response = tokenizer.decode(output[0], skip_special_tokens=True)
-
-    return response.split("Assistant:")[-1].strip()
+    inputs = tokenizer(message, return_tensors="pt")
+    outputs = model.generate(**inputs, max_new_tokens=100)
+    response = tokenizer.decode(outputs[0], skip_special_tokens=True)
+    return response
 
 gr.ChatInterface(generate_response).launch()