nambn0321 committed on
Commit
0274745
·
verified ·
1 Parent(s): c6dbe87

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -5
app.py CHANGED
@@ -27,15 +27,19 @@ tokenizer = AutoTokenizer.from_pretrained(model_repo, use_fast=False)
27
 
28
  def generate_response(prompt, max_tokens=128, temperature=0.7, top_p=0.9):
29
  try:
30
- inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
31
- outputs = model.generate(
32
- **inputs,
 
33
  max_new_tokens=max_tokens,
34
  temperature=temperature,
35
  top_p=top_p,
36
- do_sample=True
 
37
  )
38
- return tokenizer.decode(outputs[0], skip_special_tokens=True)
 
 
39
  except Exception as e:
40
  return f"Error: {str(e)}"
41
 
 
27
 
28
  def generate_response(prompt, max_tokens=128, temperature=0.7, top_p=0.9):
29
  try:
30
+ input_ids = tokenizer(prompt, return_tensors="pt").input_ids.to(model.device)
31
+
32
+ output_ids = model.generate(
33
+ input_ids,
34
  max_new_tokens=max_tokens,
35
  temperature=temperature,
36
  top_p=top_p,
37
+ do_sample=True,
38
+ use_cache=False
39
  )
40
+
41
+ output = tokenizer.decode(output_ids[0], skip_special_tokens=True)
42
+ return output
43
  except Exception as e:
44
  return f"Error: {str(e)}"
45