Update app.py

app.py CHANGED
@@ -1,319 +1,198 @@
- import os
- import re
- import textwrap
- import traceback
  import gradio as gr
  from openai import OpenAI
-
-
- #
- #
- …
  if not HF_TOKEN:
-     raise RuntimeError(
-         f"Environment variable {HF_ENV_VAR} not found. Set {HF_ENV_VAR} before running."
-     )
-
- MODEL_ID = "openai/gpt-oss-20b"
- client = OpenAI(base_url="https://router.huggingface.co/v1", api_key=HF_TOKEN)

-
-
-
- MAX_RESEARCH_CHARS = 6000  # adjust to stay within token limits

-
- …
-     repo_root = os.path.dirname(os.path.abspath(__file__))
-     chunks, total = [], 0
-     for fname in sorted(os.listdir(repo_root)):
-         if fname.lower().endswith((".txt", ".md")):
-             with open(os.path.join(repo_root, fname), "r", encoding="utf-8") as f:
-                 txt = f.read()
-             if total + len(txt) > MAX_RESEARCH_CHARS:
-                 txt = txt[: MAX_RESEARCH_CHARS - total]
-             chunks.append(f"\n--- {fname} ---\n{txt}")
-             total += len(txt)
-             if total >= MAX_RESEARCH_CHARS:
-                 break
-     return "\n".join(chunks)

-

- …

- conversation_mode = "chat"
- history_messages = [{"role": "system", "content": get_system_prompt("chat")}]
- chat_history_for_ui = []
- MAX_HISTORY_CHARS = 9000

- def trim_history_by_chars(msgs, max_chars=MAX_HISTORY_CHARS):
-     …
-     system = msgs[0]
-     tail, total = [], len(system["content"])
      for m in reversed(msgs[1:]):
-         …
-         if total + len(m["content"]) > max_chars:
-             break
          tail.append(m)
-         total += len(m["content"])
-     return [system] + list(reversed(tail))

- CODE_PATTERN = re.compile(
-     …
-     re.MULTILINE,
- )

- def is_code_like(text):
-     if not text:
-         return False
-     if CODE_PATTERN.search(text):
-         return True
-     lines = [ln for ln in text.splitlines() if ln.strip()]
-     if len(lines) >= 4:
-         codey = sum(
-             1 for ln in lines
-             if ";" in ln or "{" in ln or "}" in ln or ln.strip().endswith(":")
-         )
-         return codey / len(lines) > 0.35
-     return False

-
- def strip_code_blocks(text):
-     text_lines = []
-     for ln in text.splitlines():
-         if re.match(r"^\s*(def |class |import |from |#include|using |<)", ln):
-             continue
-         if ln.strip().startswith("```") or ln.strip().endswith("```"):
-             continue
-         text_lines.append(ln)
-     cleaned = "\n".join(text_lines).strip()
-     return re.sub(r"\n{3,}", "\n\n", cleaned) or \
-         "[Content removed: model produced code which has been stripped.]"

- # ---------------------------
- # Model call helper
- # ---------------------------
- def call_model_get_response(messages, max_tokens=2000, allow_code=False) -> str:
-     msgs = trim_history_by_chars(messages)
      try:
          resp = client.chat.completions.create(
              model=MODEL_ID,
-             messages=msgs,
-             max_tokens=max_tokens,
-             temperature=0.7,
          )
-         content = resp.choices[0].message.content or ""
      except Exception as e:
-         …
-     if not allow_code and is_code_like(content):
-         rewrite_instruction = (
-             "Rewrite the previous reply in clear prose — no code blocks, no imports, "
-             "no function/class definitions. Keep all reasoning and numeric details."
-         )
-         rewrite_msgs = [
-             msgs[0],
-             {"role": "assistant", "content": content},
-             {"role": "user", "content": rewrite_instruction},
-         ]
-         try:
-             resp2 = client.chat.completions.create(
-                 model=MODEL_ID,
-                 messages=rewrite_msgs,
-                 max_tokens=max_tokens,
-                 temperature=0.7,
-             )
-             content2 = resp2.choices[0].message.content or ""
-         except Exception:
-             return strip_code_blocks(content) + \
-                 "\n\n⚠️ Note: rewrite failed; code removed."
-         if is_code_like(content2):
-             return strip_code_blocks(content2) + \
-                 "\n\n⚠️ Note: model persisted in producing code; sanitized."
-         return content2
-     return content

-
-
-
- def get_last_assistant_tail(max_chars=1200) -> str:
-     for m in reversed(history_messages):
-         if m["role"] == "assistant" and m.get("content"):
-             return m["content"][-max_chars:]
-     return ""

-
- def user_requested_code(user_text):
-     t = (user_text or "").lower()
-     triggers = ["show code", "give me code", "provide code",
-                 "script", "python", "javascript", "implementation"]
-     return any(k in t for k in triggers)

- def chat_with_model(user_message, chat_history):
-     global conversation_mode, history_messages
-     …
-     lower = user_message.lower().strip()
-
-     # Mode switching
-     if "switch to research mode" in lower:
-         conversation_mode = "research"
-         history_messages = [{"role": "system",
-                              "content": get_system_prompt("research")}]
-         return chat_history + [("🟢 Mode switched", "🔬 Research Mode activated.")], ""
-     if "switch to chat mode" in lower:
-         conversation_mode = "chat"
-         history_messages = [{"role": "system",
-                              "content": get_system_prompt("chat")}]
-         return chat_history + [("🟢 Mode switched", "💬 Chat Mode activated.")], ""
-
-     allow_code = user_requested_code(user_message)
-     if lower in CONTINUE_KEYWORDS:
-         last_tail = get_last_assistant_tail()
-         resume_hint = (
-             "User requested continuation. Resume exactly where you left off "
-             "and DO NOT repeat earlier sections.\n\nLast assistant message tail:\n"
-             + last_tail
-         )
-         history_messages.append({"role": "user", "content": resume_hint})
-     else:
-         history_messages.append({"role": "user", "content": user_message})
-
-     history_messages[:] = trim_history_by_chars(history_messages)
-
-     try:
-         bot_text = call_model_get_response(
-             history_messages, max_tokens=2000, allow_code=allow_code
-         )
-     except Exception as e:
-         tb = traceback.format_exc()
-         bot_text = f"⚠️ **Error**: {e}\n\nTraceback:\n{tb.splitlines()[-6:]}"
-
-     history_messages.append({"role": "assistant", "content": bot_text})
-     chat_history_for_ui.append((user_message, bot_text))
-     return chat_history_for_ui, ""
-
- def reset_chat():
-     global history_messages, chat_history_for_ui
-     history_messages = [{"role": "system", "content": get_system_prompt(conversation_mode)}]
-     chat_history_for_ui = []
      return []

- #
- #
- #
-
- # Gradio UI
- # ---------------------------
  def build_ui():
-     with gr.Blocks(
-         …
-         css="""
-         …
-         .user-bubble {
-             …
-             color: white;
-             border-radius: 14px;
-             padding: 8px 12px;
-             margin: 6px;
-             max-width: 75%;
-             align-self: flex-end;
-             font-size: 14px;
-         }
-         .bot-bubble {
-             background: #e6e6e6;
-             color: #333;
-             border-radius: 14px;
-             padding: 8px 12px;
-             margin: 6px;
-             max-width: 75%;
-             align-self: flex-start;
-             font-size: 14px;
-         }
-         #controls {
-             display: flex;
-             gap: 8px;
-             align-items: center;
-             margin-top: 6px;
-         }
-         #topbar {
-             display: flex;
-             justify-content: flex-end;
-             gap: 8px;
-             margin-bottom: 6px;
-         }
-         """
-     ) as demo:
-         # Top bar with close + clear
-         with gr.Row(elem_id="topbar"):
-             close_btn = gr.Button("❌", size="sm")
-             clear_btn = gr.Button("🧹 Clear", size="sm")
-
-         chatbot = gr.Chatbot(
-             label="",
-             height=350,  # reduced height so input is visible
-             elem_id="chatbot",
-             type="tuples",
-             bubble_full_width=False,
-             avatar_images=("👤", "🤖"),
-         )
-
-         with gr.Row(elem_id="controls"):
-             msg = gr.Textbox(
-                 placeholder="Type your message here...",
-                 lines=2,
-                 scale=8,
-             )
-             submit_btn = gr.Button("🚀 Send", variant="primary", scale=2)
-
-         # Wire buttons
-         submit_btn.click(chat_with_model, inputs=[msg, chatbot], outputs=[msg, chatbot])
-         msg.submit(chat_with_model, inputs=[msg, chatbot], outputs=[msg, chatbot])
-         clear_btn.click(reset_chat, inputs=None, outputs=chatbot)
-
-     demo.launch(server_name="0.0.0.0", server_port=7860, share=False)
      return demo

-
- # ---------------------------
- # Entrypoint
- # ---------------------------
  if __name__ == "__main__":
-
-     build_ui()
+ import os, re, time, json, textwrap, traceback, numpy as np
+ from typing import List
  import gradio as gr
  from openai import OpenAI
+ from huggingface_hub import list_repo_files, hf_hub_download
+
+ # ==========================================================
+ # CONFIG
+ # ==========================================================
+ REPO_ID = "rahul7star/OhamLab-LLM"
+ API_KEY_ENV = "OPENAI_API_KEY"
+ HF_TOKEN = os.getenv(API_KEY_ENV)
  if not HF_TOKEN:
+     raise RuntimeError(f"Missing {API_KEY_ENV}")

+ MODEL_ID = "openai/gpt-4o-mini"  # efficient chat model
+ EMBED_MODEL = "text-embedding-3-small"
+ CACHE_FILE = "/tmp/ohamlab_emb_cache.json"

+ client = OpenAI(api_key=HF_TOKEN)
+ LOG_FILE = "ohamlab_chat.log"

+ def log(msg: str):
+     ts = time.strftime("%Y-%m-%d %H:%M:%S")
+     line = f"[{ts}] {msg}"
+     print(line)
+     try:
+         with open(LOG_FILE, "a", encoding="utf-8") as f:
+             f.write(line + "\n")
+     except Exception:
+         pass
+
+ # ==========================================================
+ # KNOWLEDGE SCANNER + EMBEDDINGS
+ # ==========================================================
+ def load_all_md_from_repo(repo_id: str) -> List[str]:
+     """Scan all .md files in the repo and return concatenated chunks."""
+     try:
+         files = list_repo_files(repo_id=repo_id, repo_type="model", token=HF_TOKEN)
+         md_files = [f for f in files if f.lower().endswith(".md")]
+         if not md_files:
+             log("⚠️ No markdown files found.")
+             return []
+
+         chunks = []
+         for fname in md_files:
+             try:
+                 local_path = hf_hub_download(repo_id, filename=fname, token=HF_TOKEN)
+                 with open(local_path, "r", encoding="utf-8") as f:
+                     text = f.read()
+                 text = re.sub(r"<[^>]+>", "", text)  # strip HTML
+                 # Split into ~500 char chunks
+                 buf = ""
+                 for line in text.splitlines():
+                     buf += line.strip() + " "
+                     if len(buf) > 500:
+                         chunks.append(buf.strip())
+                         buf = ""
+                 if buf:
+                     chunks.append(buf.strip())
+                 log(f"Loaded {fname} ({len(text)} chars → {len(chunks)} chunks)")
+             except Exception as e:
+                 log(f"⚠️ Failed to load {fname}: {e}")
+         return chunks
+     except Exception as e:
+         log(f"⚠️ Repo scan failed: {e}")
+         return []

+ def get_embeddings(texts: List[str]) -> np.ndarray:
+     if not texts:
+         return np.zeros((1, 1536))
+     try:
+         res = client.embeddings.create(model=EMBED_MODEL, input=texts)
+         return np.array([r.embedding for r in res.data])
+     except Exception as e:
+         log(f"Embedding error: {e}")
+         return np.zeros((len(texts), 1536))

+ def load_knowledge_cache() -> tuple[list[str], np.ndarray]:
+     """Load embeddings from cache or regenerate from repo."""
+     if os.path.exists(CACHE_FILE):
+         try:
+             with open(CACHE_FILE, "r", encoding="utf-8") as f:
+                 data = json.load(f)
+             chunks = data["chunks"]
+             embs = np.array(data["embs"])
+             log(f"Loaded cached embeddings: {len(chunks)} chunks.")
+             return chunks, embs
+         except Exception:
+             pass

+     log("Scanning Markdown files in repo for knowledge base...")
+     chunks = load_all_md_from_repo(REPO_ID)
+     embs = get_embeddings(chunks)
+     try:
+         json.dump({"chunks": chunks, "embs": embs.tolist()}, open(CACHE_FILE, "w"))
+     except Exception:
+         pass
+     log(f"Knowledge base ready: {len(chunks)} chunks.")
+     return chunks, embs
+
+ KNOWLEDGE_CHUNKS, KNOWLEDGE_EMBS = load_knowledge_cache()
+
+ # ==========================================================
+ # RETRIEVAL
+ # ==========================================================
+ def get_relevant_context(query: str, top_k=3) -> str:
+     if not KNOWLEDGE_CHUNKS or not query.strip():
+         return ""
+     q_emb = get_embeddings([query])[0]
+     sims = np.dot(KNOWLEDGE_EMBS, q_emb) / (
+         np.linalg.norm(KNOWLEDGE_EMBS, axis=1) * np.linalg.norm(q_emb)
+     )
+     top_idx = np.argsort(sims)[-top_k:][::-1]
+     return "\n\n".join(KNOWLEDGE_CHUNKS[i] for i in top_idx)
+
+ # ==========================================================
+ # CHAT ENGINE
+ # ==========================================================
+ SYSTEM_PROMPT = (
+     "You are OhamLab AI — a concise, factual chat assistant.\n"
+     "When relevant, use the OhamLab knowledge base provided in context.\n"
+     "Never show code unless explicitly requested. Keep tone professional and calm."
+ )

+ history = [{"role": "system", "content": SYSTEM_PROMPT}]
+ chat_ui_history = []
+ MAX_HISTORY_CHARS = 3000

+ def trim_msgs(msgs, max_chars=MAX_HISTORY_CHARS):
+     sys = msgs[0]
+     tail, total = [], len(sys["content"])
      for m in reversed(msgs[1:]):
+         seg = len(m["content"])
+         if total + seg > max_chars: break
          tail.append(m)
+         total += seg
+     return [sys] + list(reversed(tail))

+ def chat(user_msg, chat_hist):
+     global history, chat_ui_history
+     user_msg = (user_msg or "").strip()
+     if not user_msg:
+         return chat_ui_history, ""

+     context = get_relevant_context(user_msg)
+     if context:
+         user_msg += f"\n\n[Context]\n{context[:1500]}"

+     history.append({"role": "user", "content": user_msg})
+     trimmed = trim_msgs(history)

      try:
          resp = client.chat.completions.create(
              model=MODEL_ID,
+             messages=trimmed,
+             max_tokens=600,
+             temperature=0.6,
          )
+         reply = resp.choices[0].message.content.strip()
      except Exception as e:
+         log(f"Chat error: {e}")
+         reply = "I'm experiencing a temporary issue. Please try again shortly."

+     history.append({"role": "assistant", "content": reply})
+     chat_ui_history.append((user_msg, reply))
+     history[:] = trim_msgs(history)

+     log(f"USER: {user_msg[:60]} | BOT: {reply[:60]}")
+     return chat_ui_history, ""

+ def reset():
+     global history, chat_ui_history
+     history = [{"role": "system", "content": SYSTEM_PROMPT}]
+     chat_ui_history = []
+     log("Chat reset.")
      return []

+ # ==========================================================
+ # UI
+ # ==========================================================
  def build_ui():
+     with gr.Blocks(theme=gr.themes.Soft()) as demo:
+         gr.Markdown("### 💬 OhamLab AI — Knowledge Chat (Markdown-Aware)")
+         chatbot = gr.Chatbot(height=350)
+         msg = gr.Textbox(placeholder="Ask anything about OhamLab...", lines=1)
+         send = gr.Button("Send", variant="primary")
+         clear = gr.Button("Clear")
+
+         send.click(chat, inputs=[msg, chatbot], outputs=[chatbot, msg])
+         msg.submit(chat, inputs=[msg, chatbot], outputs=[chatbot, msg])
+         clear.click(reset, None, chatbot)
+     demo.launch(server_name="0.0.0.0", server_port=7860)
      return demo

  if __name__ == "__main__":
+     log("Starting OhamLab AI Chat Agent (Markdown Knowledge)...")
+     build_ui()
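
Note on the new retrieval step: get_relevant_context ranks the knowledge chunks by cosine similarity between the query embedding and each chunk embedding, then keeps the top-k. A minimal, self-contained sketch of that ranking logic, using made-up toy vectors in place of real text-embedding-3-small outputs (no API calls; the chunk texts here are invented for illustration):

import numpy as np

chunks = ["OhamLab builds LLM demos.", "Cache lives in /tmp.", "Chat uses gpt-4o-mini."]
chunk_embs = np.array([[0.9, 0.1], [0.1, 0.9], [0.7, 0.3]])  # pretend chunk embeddings
q_emb = np.array([0.8, 0.2])                                 # pretend query embedding

# Cosine similarity: dot product divided by the product of the vector norms.
sims = chunk_embs @ q_emb / (np.linalg.norm(chunk_embs, axis=1) * np.linalg.norm(q_emb))
top_idx = np.argsort(sims)[-2:][::-1]  # indices of the 2 most similar, best first
print([chunks[i] for i in top_idx])    # the chunks that would be injected as [Context]

Dividing by the norms makes the score depend on direction rather than magnitude, so long and short chunks compete fairly for the top-k slots.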
|