llama / app.py
Mayur74's picture
Update app.py
59291d3 verified
raw
history blame contribute delete
611 Bytes
import gradio as gr
def generate(prompt, max_new_tokens=80, temperature=0.7):
    """Generate text from ``prompt`` and return it decoded as a string.

    Relies on module-level ``tokenizer`` and ``model`` objects that are not
    defined in the visible part of this file.
    NOTE(review): confirm both are loaded before the interface is launched;
    otherwise every call fails with ``NameError``.

    Args:
        prompt: Text handed to the tokenizer.
        max_new_tokens: Upper bound on the number of newly generated tokens.
            Coerced to ``int`` because UI sliders may deliver a float.
        temperature: Sampling temperature. Coerced to ``float``. A value of
            0 or below selects greedy (non-sampling) decoding instead of
            being forwarded to the model.

    Returns:
        The first generated sequence, decoded with special tokens skipped.
    """
    # Slider widgets hand over plain JSON numbers, so the token budget may
    # arrive as a float and an integral temperature (e.g. 1) as an int.
    max_new_tokens = int(max_new_tokens)
    temperature = float(temperature)

    generation_kwargs = {"max_new_tokens": max_new_tokens}
    if temperature > 0:
        generation_kwargs["do_sample"] = True
        generation_kwargs["temperature"] = temperature
    else:
        # Assuming a Hugging Face transformers model: sampling with a
        # non-positive temperature is rejected, so the slider's minimum of 0
        # is treated as a request for deterministic (greedy) output.
        generation_kwargs["do_sample"] = False

    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
    output = model.generate(**inputs, **generation_kwargs)
    return tokenizer.decode(output[0], skip_special_tokens=True)
# Input widgets, listed in the order their values are passed to `generate`:
# (prompt, max_new_tokens, temperature).
prompt_box = gr.Textbox(label="Prompt")
max_tokens_slider = gr.Slider(
    minimum=1,
    maximum=500,
    value=80,
    label="Max New Tokens",
)
temperature_slider = gr.Slider(
    minimum=0,
    maximum=1,
    value=0.7,
    label="Temperature",
)

# Wire the widgets to `generate`; its return value is shown as plain text.
iface = gr.Interface(
    fn=generate,
    inputs=[prompt_box, max_tokens_slider, temperature_slider],
    outputs="text",
)

# Start serving the interface as soon as this script runs.
iface.launch()