Update app.py
app.py CHANGED

@@ -8,9 +8,11 @@
 import gradio as gr
 from llama_cpp import Llama
 
-#
+# .gguf model hosted in the model repo
 MODEL_REPO = "kikalore/iris"
-MODEL_FILE = "model-3b-Q4_K_M.gguf"
+MODEL_FILE = "model-3b-Q4_K_M.gguf"
+
+print("Loading model...")
 
 llm = Llama.from_pretrained(
     repo_id=MODEL_REPO,
@@ -20,6 +22,7 @@ llm = Llama.from_pretrained(
 )
 
 def chat(message, history):
+    # build the conversation context
     prompt = ""
     for human, bot in history:
         prompt += f"<|user|>{human}\n<|assistant|>{bot}\n"
@@ -28,8 +31,9 @@ def chat(message, history):
     output = llm(prompt, max_tokens=350)
     return output["choices"][0]["text"].strip()
 
-gr.ChatInterface(
+demo = gr.ChatInterface(
     fn=chat,
-    title="Iris – Fine-
-)
+    title="Iris – Fine-Tuned LLM"
+)
 
+demo.launch()
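
The hunks above hide lines 19-21 of the new file, which presumably pass MODEL_FILE and the context settings to the loader. For orientation, a minimal sketch of what the full Llama.from_pretrained call typically looks like in llama-cpp-python; filename is the library's documented keyword for selecting the GGUF file, while the n_ctx value shown is an illustrative assumption, not taken from this commit:

from llama_cpp import Llama

MODEL_REPO = "kikalore/iris"
MODEL_FILE = "model-3b-Q4_K_M.gguf"

# Downloads the GGUF weights from the Hub (requires huggingface_hub) and loads them.
# n_ctx is an illustrative assumption; the real value sits in the hidden lines of app.py.
llm = Llama.from_pretrained(
    repo_id=MODEL_REPO,
    filename=MODEL_FILE,
    n_ctx=2048,
)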
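
Likewise, the diff omits how the current message is appended before the model is called (the hidden lines 29-30). A self-contained sketch of the prompt format that chat() builds, with placeholder history values and a hypothetical final user turn:

# Placeholder conversation; the <|user|>/<|assistant|> turn format matches chat() above.
history = [("Hello", "Hi! How can I help you?")]
message = "Who are you?"

prompt = ""
for human, bot in history:
    prompt += f"<|user|>{human}\n<|assistant|>{bot}\n"
# Appending the current turn like this is an assumption about the lines the diff omits.
prompt += f"<|user|>{message}\n<|assistant|>"

print(prompt)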