"""Gradio demo for the HuggingFaceH4/zephyr-7b-beta model on the Hugging Face Hub."""

import gradio as gr

# The "models/" prefix tells gr.load to build the demo from a Hub model
# repository. Per the original author's note, this goes through the hosted
# Inference API, i.e. Hugging Face runs the model remotely for us.
demo = gr.load("models/HuggingFaceH4/zephyr-7b-beta")

if __name__ == "__main__":
    # Launch only when executed as a script, so importing this module
    # (for example to reuse `demo`) does not start the app.
    demo.launch()