aidn committed on
Commit
2c9e8e8
·
verified ·
1 Parent(s): 09df286

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +35 -30
app.py CHANGED
@@ -2,14 +2,13 @@ import gradio as gr
2
  from huggingface_hub import InferenceClient
3
  import os
4
 
5
- # Liste der Ratsmitglieder (Du kannst die Modelle hier anpassen)
6
  COUNCIL_MEMBERS = {
7
- "Der Architekt (Llama 3.3)": "meta-llama/Llama-3.3-70B-Instruct:cheapest",
8
- "Der Glitch (DeepSeek V3)": "deepseek-ai/DeepSeek-V3:cheapest",
9
- "Der Debugger (Qwen Coder)": "Qwen/Qwen2.5-Coder-32B-Instruct:cheapest"
10
  }
11
 
12
- # Dein HF_TOKEN sollte in den Space Settings hinterlegt sein
13
  client = InferenceClient(token=os.getenv("HF_TOKEN"))
14
 
15
  def ask_model(model_id, system_prompt, user_input):
@@ -18,14 +17,17 @@ def ask_model(model_id, system_prompt, user_input):
18
  {"role": "user", "content": user_input}
19
  ]
20
  response = ""
21
- for message in client.chat_completion(
22
- model=model_id,
23
- messages=messages,
24
- max_tokens=500,
25
- stream=True
26
- ):
27
- response += message.choices[0].delta.content or ""
28
- return response
 
 
 
29
 
30
  def run_council(user_prompt, rounds):
31
  history = []
@@ -33,43 +35,46 @@ def run_council(user_prompt, rounds):
33
 
34
  for r in range(int(rounds)):
35
  round_header = f"--- RUNDE {r+1} ---"
36
- history.append((None, f"## {round_header}"))
 
 
37
 
38
  round_notes = ""
39
  for name, model_id in COUNCIL_MEMBERS.items():
40
- system_msg = f"Du bist der {name} in einem Expertenrat. Diskutiere kurz und prägnant."
41
  if r > 0:
42
- system_msg += " Beziehe dich auf die vorherigen Argumente und finde einen Konsens."
43
 
44
  answer = ask_model(model_id, system_msg, current_context)
45
  formatted_answer = f"**{name}**: {answer}"
46
 
47
- history.append((None, formatted_answer))
48
  round_notes += f"\n{formatted_answer}\n"
49
  yield history # Live-Update in der UI
50
 
51
  current_context += f"\nZusammenfassung Runde {r+1}:{round_notes}"
52
 
53
  # Finale Einigung
54
- final_prompt = "Fasse die Diskussion zusammen und gib eine finale, konsolidierte Antwort."
55
- final_res = ask_model("mistralai/Mixtral-8x7B-Instruct-v0.1", "Du bist der Moderator.", current_context + final_prompt)
56
 
57
- history.append((None, "### 🏆 FINALE ENTSCHEIDUNG"))
58
- history.append((None, final_res))
59
  yield history
60
 
61
- # Gradio UI
62
- with gr.Blocks(theme=gr.themes.Soft()) as demo:
63
- gr.Markdown("# 🏛️ PromptPlenum42 (aka LLMCouncil)")
64
- gr.Markdown("Drei Experten-Modelle diskutieren deinen Prompt und versuchen, einen Konsens zu finden.")
65
 
66
  with gr.Row():
67
- input_text = gr.Textbox(label="Dein Thema / Frage", placeholder="Sollten wir zum Mars fliegen?")
68
- rounds_slider = gr.Slider(minimum=1, maximum=3, value=1, step=1, label="Diskussionsrunden")
69
 
70
- start_btn = gr.Button("Diskussion starten", variant="primary")
71
- chatbot = gr.Chatbot(label="Council Protokoll", height=600)
 
72
 
73
  start_btn.click(run_council, inputs=[input_text, rounds_slider], outputs=[chatbot])
74
 
75
- demo.launch()
 
 
2
  from huggingface_hub import InferenceClient
3
  import os
4
 
5
+ # Liste der Ratsmitglieder (nerdig & geeky)
6
  COUNCIL_MEMBERS = {
7
+ "Der Architekt": "meta-llama/Llama-3.3-70B-Instruct:cheapest",
8
+ "Der Glitch": "deepseek-ai/DeepSeek-V3:cheapest",
9
+ "Der Debugger": "Qwen/Qwen2.5-Coder-32B-Instruct:cheapest"
10
  }
11
 
 
12
  client = InferenceClient(token=os.getenv("HF_TOKEN"))
13
 
14
  def ask_model(model_id, system_prompt, user_input):
 
17
  {"role": "user", "content": user_input}
18
  ]
19
  response = ""
20
+ try:
21
+ for message in client.chat_completion(
22
+ model=model_id,
23
+ messages=messages,
24
+ max_tokens=500,
25
+ stream=True
26
+ ):
27
+ response += message.choices[0].delta.content or ""
28
+ return response
29
+ except Exception as e:
30
+ return f"🚨 Error: {str(e)}"
31
 
32
  def run_council(user_prompt, rounds):
33
  history = []
 
35
 
36
  for r in range(int(rounds)):
37
  round_header = f"--- RUNDE {r+1} ---"
38
+ # Neues Gradio 6 Format: Dictionary statt Tuple
39
+ history.append({"role": "assistant", "content": f"## {round_header}"})
40
+ yield history
41
 
42
  round_notes = ""
43
  for name, model_id in COUNCIL_MEMBERS.items():
44
+ system_msg = f"Du bist {name} in einem Expertenrat. Diskutiere kurz und prägnant."
45
  if r > 0:
46
+ system_msg += " Beziehe dich auf die vorherigen Argumente deiner Kollegen."
47
 
48
  answer = ask_model(model_id, system_msg, current_context)
49
  formatted_answer = f"**{name}**: {answer}"
50
 
51
+ history.append({"role": "assistant", "content": formatted_answer})
52
  round_notes += f"\n{formatted_answer}\n"
53
  yield history # Live-Update in der UI
54
 
55
  current_context += f"\nZusammenfassung Runde {r+1}:{round_notes}"
56
 
57
  # Finale Einigung
58
+ final_res = ask_model("mistralai/Mixtral-8x7B-Instruct-v0.1", "Du bist der Moderator.", current_context + "Fasse alles final zusammen.")
 
59
 
60
+ history.append({"role": "assistant", "content": "### 🏆 FINALE ENTSCHEIDUNG"})
61
+ history.append({"role": "assistant", "content": final_res})
62
  yield history
63
 
64
# --- Gradio UI (script entry point) ---
# NOTE(review): the scraped source carried diff "+" markers and had lost all
# indentation; reconstructed here as runnable Python.
with gr.Blocks() as demo:
    gr.Markdown("# 🏛️ Der Subraum-Stammtisch")
    gr.Markdown("> Status: Initialisiere Prompt-Plenum auf Frequenz 0x42...")

    with gr.Row():
        # User question and the number of discussion rounds fed into run_council.
        input_text = gr.Textbox(
            label="Input-Vektor (Deine Frage)",
            placeholder="Sollten wir zum Mars fliegen?",
        )
        rounds_slider = gr.Slider(
            minimum=1, maximum=3, value=1, step=1, label="Diskussionszyklen"
        )

    start_btn = gr.Button("Protokoll starten", variant="primary")
    # type="messages" makes the Chatbot consume {"role": ..., "content": ...}
    # dicts, which is exactly what run_council appends to its history.
    chatbot = gr.Chatbot(label="Council Protokoll", height=600, type="messages")

    # run_council is a generator (it yields history repeatedly), so the
    # transcript streams into the Chatbot live.
    start_btn.click(run_council, inputs=[input_text, rounds_slider], outputs=[chatbot])

# Guard the launch so importing this module (e.g. in tests) has no side
# effects; Hugging Face Spaces execute app.py as __main__, so behavior there
# is unchanged.
if __name__ == "__main__":
    # NOTE(review): the original comment claims the theme moved to launch()
    # in "Gradio 6". In Gradio <= 5, `theme` is a gr.Blocks(...) constructor
    # argument and launch() accepts no such parameter — confirm against the
    # pinned Gradio version; otherwise use gr.Blocks(theme=gr.themes.Soft()).
    demo.launch(theme=gr.themes.Soft())