Update app.py
Browse files
app.py
CHANGED
|
@@ -34,9 +34,9 @@ tokenizer = AutoTokenizer.from_pretrained(model_repo, use_fast=False)
|
|
| 34 |
def generate_response(prompt, max_tokens=128, temperature=0.7, top_p=0.9):
|
| 35 |
try:
|
| 36 |
chat = [{"role": "user", "content": prompt}]
|
| 37 |
-
|
| 38 |
|
| 39 |
-        inputs = tokenizer(
|
| 40 |
|
| 41 |
with torch.no_grad():
|
| 42 |
outputs = model.generate(
|
|
|
|
| 34 |
def generate_response(prompt, max_tokens=128, temperature=0.7, top_p=0.9):
|
| 35 |
try:
|
| 36 |
chat = [{"role": "user", "content": prompt}]
|
| 37 |
+        formatted_prompt = tokenizer.apply_chat_template(chat, tokenize=False, add_generation_prompt=True)
|
| 38 |
|
| 39 |
+        inputs = tokenizer(formatted_prompt, return_tensors="pt").to(model.device)
|
| 40 |
|
| 41 |
with torch.no_grad():
|
| 42 |
outputs = model.generate(
|