YUGISUNG committed on
Commit
0066928
·
verified ·
1 Parent(s): 6d40e78

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -5
app.py CHANGED
@@ -4,8 +4,8 @@ import torch
4
 
5
  # Load model and tokenizer
6
  model_name = "openchat/openchat-3.5-1210"
7
- tokenizer = AutoTokenizer.from_pretrained(model_name)
8
- model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.float16, device_map="auto")
9
 
10
  # Persona prompts
11
  persona_prompts = {
@@ -20,9 +20,10 @@ def format_openchat_prompt(system_prompt, user_input):
20
  def chatbot(persona, input_text):
21
  system_prompt = persona_prompts.get(persona, "")
22
  prompt = format_openchat_prompt(system_prompt, input_text)
23
-
24
  inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
25
 
 
 
26
  with torch.no_grad():
27
  outputs = model.generate(
28
  **inputs,
@@ -31,7 +32,7 @@ def chatbot(persona, input_text):
31
  temperature=0.7,
32
  top_p=0.9,
33
  eos_token_id=tokenizer.eos_token_id,
34
- pad_token_id=tokenizer.pad_token_id
35
  )
36
 
37
  full_output = tokenizer.decode(outputs[0], skip_special_tokens=True)
@@ -50,4 +51,4 @@ iface = gr.Interface(
50
  description="Chat with the voice of Elon Musk, Jensen Huang, or Jeff Bezos. Powered by OpenChat 3.5 + Transformers.",
51
  )
52
 
53
- iface.launch(share=True)
 
4
 
5
  # Load model and tokenizer
6
  model_name = "openchat/openchat-3.5-1210"
7
+ tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
8
+ model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.float16, device_map="auto", trust_remote_code=True)
9
 
10
  # Persona prompts
11
  persona_prompts = {
 
20
  def chatbot(persona, input_text):
21
  system_prompt = persona_prompts.get(persona, "")
22
  prompt = format_openchat_prompt(system_prompt, input_text)
 
23
  inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
24
 
25
+ pad_token_id = tokenizer.pad_token_id if tokenizer.pad_token_id is not None else tokenizer.eos_token_id
26
+
27
  with torch.no_grad():
28
  outputs = model.generate(
29
  **inputs,
 
32
  temperature=0.7,
33
  top_p=0.9,
34
  eos_token_id=tokenizer.eos_token_id,
35
+ pad_token_id=pad_token_id
36
  )
37
 
38
  full_output = tokenizer.decode(outputs[0], skip_special_tokens=True)
 
51
  description="Chat with the voice of Elon Musk, Jensen Huang, or Jeff Bezos. Powered by OpenChat 3.5 + Transformers.",
52
  )
53
 
54
+ iface.launch()