Spaces:

oofnan
/

StegBot2-Showcase

Runtime error

File size: 1,727 Bytes

929430b
c147c23
929430b
3d5a205
929430b
 
9185f46
c147c23
9185f46
929430b
22acddf
 
929430b
aac0c09
 
 
929430b
 
aac0c09
22acddf
8b9a6ea
929430b
aac0c09
929430b
 
 
 
3d5a205
929430b
 
 
fab7ce1
 
3d5a205
929430b
 
 
 
 
9185f46
 
929430b
 
 
3d5a205
 
929430b

import gradio as gr
import torch, os
from transformers import AutoModelForCausalLM, AutoTokenizer
from transformers import StoppingCriteria, TextIteratorStreamer
from threading import Thread

torch.set_num_threads(2)
HF_TOKEN = os.environ.get("HF_TOKEN")

# Loading the tokenizer and model from Hugging Face's model hub.
tokenizer = AutoTokenizer.from_pretrained("oofnan/stegBot2", use_auth_token=HF_TOKEN)
model = AutoModelForCausalLM.from_pretrained("oofnan/stegBot2", use_auth_token=HF_TOKEN)

def count_tokens(text):
    return len(tokenizer.tokenize(text))

# Function to generate model predictions.
def predict(message, history):

    formatted_prompt = f"<start_of_turn>user\nYou are a helpful assistant that provides answers to user questions;{message}<end_of_turn>\n<start_of_turn>model\n"
    model_inputs = tokenizer(formatted_prompt, return_tensors="pt")
    
    streamer = TextIteratorStreamer(tokenizer, timeout=120., skip_prompt=True, skip_special_tokens=True)
    
    generate_kwargs = dict(
        model_inputs,
        streamer=streamer,
        max_new_tokens=2048 - count_tokens(formatted_prompt),
        top_p=0.2,
        top_k=20,
        temperature=0.1,
        repetition_penalty=2.0,
        length_penalty=-0.5,
        num_beams=1
    )
    t = Thread(target=model.generate, kwargs=generate_kwargs)
    t.start()  # Starting the generation in a separate thread.
    partial_message = ""
    for new_token in streamer:
        partial_message += new_token
        yield partial_message

# Setting up the Gradio chat interface.
gr.ChatInterface(predict,
                 title="Gemma 2b Instruct Chat",
                 description=None
                 ).launch()  # Launching the web interface.