File size: 759 Bytes
eefcfe1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
b8c2412
 
eefcfe1
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
import gradio as gr
from transformers import AutoTokenizer, AutoModelForCausalLM

# Hub repository that supplies both the tokenizer files and the model weights.
MODEL_ID = "Fredithefish/Guanaco-3B-Uncensored-v2"

# Loaded once at import time; the request handler reuses these module globals.
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
model = AutoModelForCausalLM.from_pretrained(MODEL_ID)

def chat_with_model(input_text: str) -> str:
    """Generate a model reply for a single user message.

    The message is prefixed with ``"You: "``, tokenized (truncated to at most
    512 tokens) and handed to ``model.generate``.

    Args:
        input_text: Text entered by the user. ``None`` is treated as an
            empty message.

    Returns:
        The first generated sequence decoded to text with special tokens
        removed. For a causal LM, ``generate`` returns the prompt tokens
        followed by the continuation, so the text starts with the prompt.
    """
    prompt = "You: " + (input_text or "")
    encoded = tokenizer(
        prompt,
        return_tensors="pt",
        max_length=512,
        truncation=True,
    )
    # ``max_new_tokens`` bounds only the continuation. The previous
    # ``max_length=100`` also counted the prompt, so a prompt of 100+ tokens
    # (allowed by the 512-token truncation above) left no room to generate.
    response_ids = model.generate(
        encoded["input_ids"],
        attention_mask=encoded["attention_mask"],
        max_new_tokens=100,
        num_return_sequences=1,
        no_repeat_ngram_size=2,
    )
    return tokenizer.decode(response_ids[0], skip_special_tokens=True)

# Single-turn UI: one text input wired to chat_with_model, one text output.
# The first positional argument of gr.Textbox is the initial *value*, so the
# captions must be passed as ``label=``; otherwise the input box starts
# pre-filled with "You:" and that text is sent to the model.
iface = gr.Interface(
    fn=chat_with_model,
    inputs=gr.Textbox(label="You:"),
    outputs=gr.Textbox(label="Bot:"),
)

# Start the web server when the script is executed.
iface.launch()