plain_untuned

Sleeping

App Files Community

chthees committed on Dec 3, 2025

Commit

0414a9d

verified ·

1 Parent(s): c4e0e89

Update app.py

Browse files

Files changed (1) hide show

app.py +23 -31

app.py CHANGED Viewed

@@ -1,15 +1,13 @@
 import gradio as gr
 from llama_cpp import Llama
-# --- 1. MODELL LADEN ---
 llm = Llama.from_pretrained(
     repo_id="simonper/Llama-3.2-1B-bnb-4bit_finetome-100k_gguf_3epochs_4bit",
     filename="Llama-3.2-1B.Q4_K_M.gguf",
     n_ctx=2048,
-    n_threads=2, # Optimiert für Hugging Face CPU Basic Tier
 )
-# --- 2. HELPER: PROMPT BAUEN ---
 def build_prompt(system_message: str, history: list[dict], user_message: str) -> str:
     lines = []
     if system_message:
@@ -25,7 +23,7 @@ def build_prompt(system_message: str, history: list[dict], user_message: str) ->
     lines.append("Assistant:")
     return "\n".join(lines)
-# --- 3. RESPOND FUNKTION ---
 def respond(
     message,
     history: list[dict[str, str]],
@@ -33,42 +31,39 @@ def respond(
     max_tokens,
     temperature,
     top_p,
-    repetition_penalty,  # <--- NEUER PARAMETER
     style_mode,
 ):
-    # --- A. Style Logik ---
     base_instruction = (
-        "Du bist ein hilfreicher Assistent zur Textumformulierung. "
-        "Gib die folgende Eingabe des Nutzers inhaltlich identisch zurück, ändere nur die Formulierungen."
     )
     context = ""
-    if style_mode == "Professionelle E-Mail":
-        context = "Formuliere die Eingabe extrem höflich und professionell (Business-Deutsch)."
-    elif style_mode == "Gen-Z / Jugendsprache":
-        context = "Formuliere die Eingabe in Jugendsprache (nutze Wörter wie 'cringe', 'wild', 'sus', Emojis)."
     elif style_mode == "Shakespeare":
-        context = "Formuliere die Eingabe in altmodischem, poetischem Deutsch."
-    elif style_mode == "Passiv-Aggressiv":
-        context = "Formuliere die Eingabe höflich, aber unterschwellig passiv-aggressiv."
-    elif style_mode == "Lustig/Ironisch":
-        context = "Formuliere die Eingabe lustig und ironisch."
     else:
-        context = "Antworte ganz normal."
-    final_system = f"{base_instruction} {context} Verändere nicht die Bedeutung."
-    # --- B. Prompt bauen ---
     prompt = build_prompt(final_system, history, message)
-    # --- C. Modell aufrufen ---
     output = llm(
         prompt,
         max_tokens=int(max_tokens),
         temperature=float(temperature),
         top_p=float(top_p),
-        repeat_penalty=float(repetition_penalty), # <--- HIER WIRD ER GENUTZT
         stop=["User:", "System:"],
         echo=False
     )
@@ -84,26 +79,23 @@ chatbot = gr.ChatInterface(
     additional_inputs=[
         gr.Textbox(value="", label="System Prompt (Hidden)", visible=False),
-        # Bestehende Slider
         gr.Slider(minimum=1, maximum=2048, value=512, label="Max Tokens"),
         gr.Slider(minimum=0.1, maximum=4.0, value=0.7, label="Temperature"),
         gr.Slider(minimum=0.1, maximum=1.0, value=0.95, label="Top-p"),
-        # NEUER SLIDER
-        # Standard 1.0 = Keine Strafe. 1.2 ist meist ein guter Wert für Llama.
-        gr.Slider(minimum=1.0, maximum=2.0, value=1.2, step=0.05, label="Repetition Penalty"),
-        # Style Dropdown
         gr.Dropdown(
-            choices=["Normal", "Professionelle E-Mail", "Gen-Z / Jugendsprache", "Shakespeare", "Passiv-Aggressiv", "Lustig/Ironisch"],
             value="Normal",
-            label="Wähle den Stil / Tonfall"
         )
     ],
 )
 with gr.Blocks() as demo:
-    gr.Markdown("# 🎭 Der Text-Wandler")
     with gr.Sidebar():
         gr.LoginButton()
     chatbot.render()

 import gradio as gr
 from llama_cpp import Llama
 llm = Llama.from_pretrained(
     repo_id="simonper/Llama-3.2-1B-bnb-4bit_finetome-100k_gguf_3epochs_4bit",
     filename="Llama-3.2-1B.Q4_K_M.gguf",
     n_ctx=2048,
+    n_threads=2,
 )
 def build_prompt(system_message: str, history: list[dict], user_message: str) -> str:
     lines = []
     if system_message:
     lines.append("Assistant:")
     return "\n".join(lines)
 def respond(
     message,
     history: list[dict[str, str]],
     max_tokens,
     temperature,
     top_p,
+    repetition_penalty,
     style_mode,
 ):
+    # Translated instruction
     base_instruction = (
+        "You are a friendly ChatBot that answers questions and can hold conversations. "
+        "Please always answer in one of the following styles: "
     )
     context = ""
+    # Branch keys must match the English Dropdown choices below; "Passive-Aggressive" has no branch here and falls through to the default "Answer normally."
+    if style_mode == "Professional Email":
+        context = "Formulate the answer extremely politely and professionally (Business English)."
+    elif style_mode == "Gen-Z / Slang":
+        context = "Formulate the answer in Gen-Z slang (use words like 'cringe', 'wild', 'sus', emojis)."
     elif style_mode == "Shakespeare":
+        context = "Formulate the answer in old-fashioned, poetic English."
+    elif style_mode == "Funny/Ironic":
+        context = "Formulate the answer in a funny and ironic way."
     else:
+        context = "Answer normally."
+    final_system = f"{base_instruction} {context}"
     prompt = build_prompt(final_system, history, message)
     output = llm(
         prompt,
         max_tokens=int(max_tokens),
         temperature=float(temperature),
         top_p=float(top_p),
+        repeat_penalty=float(repetition_penalty),
         stop=["User:", "System:"],
         echo=False
     )
     additional_inputs=[
         gr.Textbox(value="", label="System Prompt (Hidden)", visible=False),
         gr.Slider(minimum=1, maximum=2048, value=512, label="Max Tokens"),
         gr.Slider(minimum=0.1, maximum=4.0, value=0.7, label="Temperature"),
         gr.Slider(minimum=0.1, maximum=1.0, value=0.95, label="Top-p"),
+        gr.Slider(minimum=1.0, maximum=2.0, value=1.3, step=0.05, label="Repetition Penalty"),
+        # Translated Dropdown Options
         gr.Dropdown(
+            choices=["Normal", "Professional Email", "Gen-Z / Slang", "Shakespeare", "Passive-Aggressive", "Funny/Ironic"],
             value="Normal",
+            label="Choose the Style / Tone"
         )
     ],
 )
 with gr.Blocks() as demo:
+    # Translated Title
+    gr.Markdown("# Advanced Chat Bot")
     with gr.Sidebar():
         gr.LoginButton()
     chatbot.render()