| import gradio as gr | |
def generate(prompt, max_new_tokens=80, temperature=0.7):
    """Generate text for *prompt* and return it as a decoded string.

    Uses the module-level ``tokenizer`` and ``model`` objects, which are
    defined outside this function (presumably a Hugging Face tokenizer and
    generative model -- confirm against the rest of the file).

    Args:
        prompt: Text that is tokenized and passed to ``model.generate``.
        max_new_tokens: Forwarded to ``model.generate`` as ``max_new_tokens``.
            Coerced to ``int`` because UI sliders may deliver the value as a
            float.
        temperature: Sampling temperature. A positive value enables sampling
            with that temperature; a value of 0 or below selects
            deterministic (non-sampling) decoding instead of raising.

    Returns:
        ``output[0]`` decoded by ``tokenizer.decode`` with special tokens
        skipped.
    """
    # Slider values arrive as plain JSON numbers, so normalise their types
    # before handing them to the generation API.
    max_new_tokens = int(max_new_tokens)
    temperature = float(temperature)

    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)

    # transformers rejects a non-positive temperature when sampling, so a
    # temperature of 0 (reachable from the UI slider) is mapped to
    # do_sample=False rather than being forwarded.
    if temperature > 0:
        sampling_kwargs = {"do_sample": True, "temperature": temperature}
    else:
        sampling_kwargs = {"do_sample": False}

    output = model.generate(
        **inputs,
        max_new_tokens=max_new_tokens,
        **sampling_kwargs,
    )
    return tokenizer.decode(output[0], skip_special_tokens=True)
# Input widgets, listed in the same order as generate()'s parameters:
# prompt, max_new_tokens, temperature.
input_components = [
    gr.Textbox(label="Prompt"),
    gr.Slider(minimum=1, maximum=500, value=80, label="Max New Tokens"),
    gr.Slider(minimum=0, maximum=1, value=0.7, label="Temperature"),
]

# Wrap generate() in a Gradio interface with a plain-text output.
iface = gr.Interface(fn=generate, inputs=input_components, outputs="text")

# Start the web UI.
iface.launch()