Spaces:

Nguyen5
/

chatbot

Sleeping

App Files Files Community

Nguyen5 committed on Dec 3, 2025

Commit

c517565

1 Parent(s): 8308ad9

commit

Browse files

Files changed (1) hide show

app.py +98 -22

app.py CHANGED Viewed

@@ -7,72 +7,148 @@ from supabase_client import supabase
 client = OpenAI()
 def build_viewer():
     resp = supabase.table("documents").select("content, metadata").execute()
     items = resp.data or []
     po_html = []
     hg_html = []
     for row in items:
         meta = row["metadata"]
         src = meta["source"]
-        anchor = meta["anchor_id"]
-        page = meta.get("page", "")
-        block_html = f"<div id='{anchor}'><b>{src} {page}</b><br>{row['content']}</div>"
         if "Prüfungsordnung" in src:
             po_html.append(block_html)
         else:
             hg_html.append(block_html)
     return "".join(po_html), "".join(hg_html)
-PO_HTML, HG_HTML = build_viewer()
 def transcribe(audio):
     if audio is None:
         return ""
-    with open(audio, "rb") as f:
-        res = client.audio.transcriptions.create(
-            model="whisper-1", file=f, language="de", temperature=0
-        )
-    return res.text.strip()
 def chat_fn(text, audio, history):
     text = text.strip() if text else ""
     if text:
         q = text
     else:
         q = transcribe(audio)
     answer, docs = rag_answer(q, history or [])
     html = "<ol>"
     for i, d in enumerate(docs):
         meta = d["metadata"]
-        anchor = meta["anchor_id"]
         snippet = d["content"][:200]
-        html += f"<li><a href='#{anchor}'><b>Quelle {i+1}</b></a><br>{snippet}...</li>"
     html += "</ol>"
     new_hist = (history or []) + [
         {"role": "user", "content": q},
-        {"role": "assistant", "content": answer}
     ]
-    return new_hist, html, gr.update(value=None)  # reset audio
 with gr.Blocks() as demo:
-    chatbot = gr.Chatbot()
-    text_input = gr.Textbox(label="Text Eingabe")
-    audio_input = gr.Audio(type="filepath", label="Mikrofon")
-    send = gr.Button("Senden")
-    po_view = gr.HTML(f"<div style='height:250px; overflow:auto'>{PO_HTML}</div>")
-    hg_view = gr.HTML(f"<div style='height:250px; overflow:auto'>{HG_HTML}</div>")
-    sources = gr.HTML()
-    send.click(
         chat_fn,
         inputs=[text_input, audio_input, chatbot],
         outputs=[chatbot, sources, audio_input]
     )
-demo.launch()

 client = OpenAI()
+# -------------------------------------------
+# DYNAMIC VIEWER – built from a fresh Supabase query on every call
+# -------------------------------------------
 def build_viewer():
     """Render the stored documents as two HTML fragments for the viewer panes.

     Selects ``content`` and ``metadata`` from the Supabase ``documents``
     table on every call, so the result reflects the table at call time.

     Returns:
         A ``(po_html, hg_html)`` tuple of HTML strings. Rows whose
         ``metadata["source"]`` contains "Prüfungsordnung" are concatenated
         into the first string, all remaining rows into the second.
     """
     # Function-scope import keeps the block self-contained.
     from html import escape

     resp = supabase.table("documents").select("content, metadata").execute()
     items = resp.data or []

     po_html = []
     hg_html = []
     for row in items:
         # Tolerate rows with null/partial metadata instead of failing the
         # whole viewer on a single bad record.
         meta = row.get("metadata") or {}
         src = str(meta.get("source") or "")
         anchor = meta.get("anchor_id")
         page = meta.get("page")

         page_info = f"(Seite {escape(str(page))})" if page else ""
         # Emit an id only when an anchor exists; otherwise every anchor-less
         # row would share the literal id 'None'.
         id_attr = f" id='{escape(str(anchor), quote=True)}'" if anchor else ""
         # NOTE(review): content is treated as plain text and escaped; confirm
         # the table never stores markup that is meant to be rendered.
         content = escape(str(row.get("content") or ""))

         block_html = (
             f"<div{id_attr} style='margin-bottom:14px;'>"
             f"<b>{escape(src)} {page_info}</b><br>{content}"
             f"</div>"
         )
         if "Prüfungsordnung" in src:
             po_html.append(block_html)
         else:
             hg_html.append(block_html)
     return "".join(po_html), "".join(hg_html)
+# -------------------------------------------
+# WHISPER – German speech-to-text (fixed) + audio reset
+# -------------------------------------------
 def transcribe(audio):
     """Transcribe a recorded audio file to German text via the Whisper API.

     Args:
         audio: Path of the audio file to send, or ``None``/empty when nothing
             was recorded.

     Returns:
         The stripped transcript, or ``""`` when there is no audio or the
         transcription attempt fails for any reason.
     """
     import logging

     if not audio:
         return ""
     try:
         with open(audio, "rb") as f:
             res = client.audio.transcriptions.create(
                 model="whisper-1",
                 file=f,
                 language="de",
                 temperature=0.0,
             )
         return (res.text or "").strip()
     except Exception:
         # Deliberately best-effort: the caller treats "" as "no input".
         # Log the failure so API/file errors are not silently lost.
         logging.getLogger(__name__).exception("Audio transcription failed")
         return ""
+# -------------------------------------------
+# MAIN CHAT FUNCTION
+# -------------------------------------------
 def chat_fn(text, audio, history):
     """Answer one user turn and build the list of cited sources.

     Args:
         text: Typed question; takes priority over audio when non-blank.
         audio: Audio file path passed to ``transcribe`` when no text is given.
         history: Previous chat messages as ``{"role", "content"}`` dicts, or
             ``None``.

     Returns:
         A ``(history, sources_html, audio_update)`` tuple: the chat history
         (extended by the new user/assistant pair when a question was found),
         an HTML string for the sources pane, and a ``gr.update`` that clears
         the audio input.
     """
     # Function-scope import keeps the block self-contained.
     from html import escape

     history = history or []
     text = text.strip() if text else ""

     # Typed text wins; audio is only transcribed when no text was entered.
     q = text or transcribe(audio)
     if not q:
         return history, "<p>Bitte Text oder Mikrofon benutzen.</p>", gr.update(value=None)

     # Retrieval-augmented answer plus the documents it was based on.
     answer, docs = rag_answer(q, history)

     # Build the source list.
     entries = []
     for i, d in enumerate(docs or [], start=1):
         meta = d["metadata"] or {}
         anchor = meta.get("anchor_id")
         content = d["content"] or ""
         snippet = escape(content[:200])
         # Only mark the snippet as shortened when text was actually cut off.
         tail = "..." if len(content) > 200 else ""
         if anchor:
             label = (
                 f"<a href='#{escape(str(anchor), quote=True)}' style='font-weight:bold;'>"
                 f"Quelle {i}"
                 f"</a>"
             )
         else:
             # No anchor to jump to: show the label without a dead '#None' link.
             label = f"<b>Quelle {i}</b>"
         entries.append(f"<li>{label}<br>{snippet}{tail}</li>")
     sources_html = "<ol>" + "".join(entries) + "</ol>"

     # History in Gradio "messages" style (role/content dicts).
     new_hist = history + [
         {"role": "user", "content": q},
         {"role": "assistant", "content": answer},
     ]

     # Clear the audio component so the recording is not re-sent next turn.
     return new_hist, sources_html, gr.update(value=None)
+# -------------------------------------------
+# UI
+# -------------------------------------------
 def _viewer_pane(inner_html):
     """Wrap a viewer fragment in the fixed-height, scrollable pane markup."""
     return (
         f"<div style='height:250px;overflow:auto;border:1px solid #ccc;"
         f"padding:10px'>{inner_html}</div>"
     )


 def _load_viewers():
     """Re-query the documents and return both rendered panes."""
     po_html, hg_html = build_viewer()
     return _viewer_pane(po_html), _viewer_pane(hg_html)


 with gr.Blocks() as demo:
     gr.Markdown("# ⚖️ Sprachbasierter Chatbot für Prüfungsrecht")
     with gr.Row():
         with gr.Column(scale=3):
             chatbot = gr.Chatbot(label="Chat")
             text_input = gr.Textbox(label="Text Eingabe", placeholder="Frage hier eingeben...")
             audio_input = gr.Audio(
                 type="filepath",
                 label="Spracheingabe (Mikrofon)"
             )
             send_btn = gr.Button("Senden")
         with gr.Column(scale=2):
             # The panes start empty and are filled by the page-load event
             # below, so every visitor sees the current table contents and a
             # database outage cannot prevent the app from starting.
             po_view = gr.HTML()
             hg_view = gr.HTML()
             sources = gr.HTML()

     # Chat event
     send_btn.click(
         chat_fn,
         inputs=[text_input, audio_input, chatbot],
         outputs=[chatbot, sources, audio_input]
     )

     # Refresh both document panes each time the page is opened.
     demo.load(_load_viewers, outputs=[po_view, hg_view])

 demo.launch(ssr_mode=False)