import gradio as gr


def generate(prompt: str, max_new_tokens: int = 80, temperature: float = 0.7) -> str:
    """Generate text for *prompt* and return the decoded first sequence.

    Relies on ``tokenizer`` and ``model`` being defined elsewhere in this
    module (NOTE(review): they look like a Hugging Face transformers
    tokenizer/model pair -- confirm against the code that creates them).

    Args:
        prompt: Text to tokenize and feed to the model.
        max_new_tokens: Upper bound on generated tokens; coerced to ``int``.
        temperature: Sampling temperature. A value <= 0 switches to
            non-sampling (greedy) decoding instead of sampling.

    Returns:
        ``output[0]`` decoded with special tokens skipped.
    """
    # UI sliders may hand over floats (e.g. 80.0); a token count must be an int.
    max_new_tokens = int(max_new_tokens)

    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)

    generation_kwargs = {"max_new_tokens": max_new_tokens}
    if temperature > 0:
        generation_kwargs.update(do_sample=True, temperature=temperature)
    else:
        # Sampling with a non-positive temperature is rejected by the
        # generation API, and the slider below allows 0, so decode
        # deterministically in that case rather than crash the request.
        generation_kwargs["do_sample"] = False

    output = model.generate(**inputs, **generation_kwargs)
    return tokenizer.decode(output[0], skip_special_tokens=True)


# Web UI: one prompt box plus sliders mapped positionally onto
# generate(prompt, max_new_tokens, temperature).
iface = gr.Interface(
    fn=generate,
    inputs=[
        gr.Textbox(label="Prompt"),
        # step=1 keeps the token budget a whole number in the UI.
        gr.Slider(minimum=1, maximum=500, step=1, value=80, label="Max New Tokens"),
        gr.Slider(minimum=0, maximum=1, value=0.7, label="Temperature"),
    ],
    outputs="text",
)

iface.launch()