test_gemma_2 / app.py
lljz66's picture
Update app.py
da8829b verified
raw
history blame contribute delete
490 Bytes
import gradio as gr
import subprocess
# Program that generate() starts via subprocess.run. The path is relative,
# so it is resolved against the working directory of the running process.
LLAMA_BIN = "./llama.cpp/build/bin/main"
# Value generate() passes after the "-m" flag; presumably a GGUF model file,
# judging by the extension -- confirm against the deployed Space.
MODEL = "./model.gguf"
def generate(prompt, *, llama_bin=None, model=None, n_predict=200, threads=4):
    """Run the llama.cpp command-line binary once and return its output.

    Args:
        prompt: Text passed to the binary after ``-p``. ``None`` is treated
            as an empty prompt.
        llama_bin: Executable to start. Defaults to the module-level
            ``LLAMA_BIN``.
        model: Value passed after ``-m``. Defaults to the module-level
            ``MODEL``.
        n_predict: Value passed after ``-n`` (llama.cpp's limit on the
            number of tokens to generate). Defaults to 200.
        threads: Value passed after ``-t`` (llama.cpp's thread count).
            Defaults to 4.

    Returns:
        Everything the process wrote to standard output, decoded as UTF-8.

    Raises:
        OSError: If the executable cannot be started (for example
            ``FileNotFoundError`` when the path does not exist).
        RuntimeError: If the process exits with a non-zero status. The
            message carries the exit code and the tail of its stderr.
    """
    binary = LLAMA_BIN if llama_bin is None else llama_bin
    command = [
        binary,
        "-m", MODEL if model is None else model,
        "-p", "" if prompt is None else str(prompt),
        "-n", str(n_predict),
        "-t", str(threads),
    ]
    completed = subprocess.run(
        command,
        # Never let the child wait on our stdin: a binary that prompts for
        # input would otherwise block the request indefinitely.
        stdin=subprocess.DEVNULL,
        capture_output=True,
        # Decode explicitly instead of relying on the locale, and replace
        # undecodable bytes (e.g. a multi-byte character cut off at the
        # token limit) rather than raising UnicodeDecodeError.
        encoding="utf-8",
        errors="replace",
    )
    if completed.returncode != 0:
        # Surface the failure instead of returning empty or partial text;
        # only the tail of stderr is kept so the message stays readable.
        stderr_tail = completed.stderr.strip()[-2000:]
        raise RuntimeError(
            f"{binary} exited with code {completed.returncode}: {stderr_tail}"
        )
    return completed.stdout
# Wrap generate() in a single-textbox-in, single-textbox-out Gradio UI and
# serve it on every network interface at port 7860.
demo = gr.Interface(fn=generate, inputs="text", outputs="text")
demo.launch(server_port=7860, server_name="0.0.0.0")