Multi_Model_AI_AGENT_VectorDB_langchain_json

Sleeping

App Files Files Community

Seth0330 commited on Jun 12, 2025

Commit

657f503

verified ·

1 Parent(s): 4e778f2

Update app.py

Browse files

Files changed (1) hide show

app.py +63 -108

app.py CHANGED Viewed

@@ -1,13 +1,14 @@
 import streamlit as st
 import json
-import difflib
-import re
 def normalize(s):
     return ' '.join(str(s).lower().replace("_", " ").replace("-", " ").replace(".", " ").split())
 def is_fuzzy_match(a, b, threshold=0.7):
-    ratio = difflib.SequenceMatcher(None, a, b).ratio()
     return ratio >= threshold or a in b or b in a
 def recursive_fuzzy_value_search(target_value):
@@ -17,26 +18,13 @@ def recursive_fuzzy_value_search(target_value):
         def _search(obj, path):
             if isinstance(obj, dict):
                 for k, v in obj.items():
-                    # Match ANY primitive value (str, int, float, bool)
                     if isinstance(v, (str, int, float, bool)) and is_fuzzy_match(norm_target, normalize(v)):
                         matches.append({
-                            "match_path": path + [k],
-                            "matched_value": v,
                             "key": k,
-                            "record": obj,
-                            "file": file_name
                         })
-                    # Check inside nested dicts
-                    if isinstance(v, dict):
-                        for nk, nv in v.items():
-                            if isinstance(nv, (str, int, float, bool)) and is_fuzzy_match(norm_target, normalize(nv)):
-                                matches.append({
-                                    "match_path": path + [k, nk],
-                                    "matched_value": nv,
-                                    "key": nk,
-                                    "record": v,
-                                    "file": file_name
-                                })
                     _search(v, path + [k])
             elif isinstance(obj, list):
                 for idx, item in enumerate(obj):
@@ -44,105 +32,72 @@ def recursive_fuzzy_value_search(target_value):
         _search(data, [])
     return matches
-def show_all_strings():
-    found = []
-    for file_name, data in st.session_state.json_data.items():
-        def recursive(obj, path):
-            if isinstance(obj, dict):
-                for k, v in obj.items():
-                    if isinstance(v, (str, int, float, bool)):
-                        found.append(f"{file_name} | {'.'.join(path + [k])} = {v}")
-                    elif isinstance(v, dict):
-                        for nk, nv in v.items():
-                            if isinstance(nv, (str, int, float, bool)):
-                                found.append(f"{file_name} | {'.'.join(path + [k, nk])} = {nv}")
-                    recursive(v, path + [k])
-            elif isinstance(obj, list):
-                for idx, item in enumerate(obj):
-                    recursive(item, path + [f"[{idx}]"])
-        recursive(data, [])
-    return found
-def handle_user_query(query):
-    patterns = [
-        r"(?:last\s*login.*?for|when\s+did)\s+([a-zA-Z0-9 _\-\.@]+)",
-        r"when\s+was\s+([a-zA-Z0-9 _\-\.@]+)\s+last\s+(?:login|logged\s*in)",
-        r"last\s*login\s*of\s+([a-zA-Z0-9 _\-\.@]+)",
-        r"(?:info|details|record) for\s+([a-zA-Z0-9 _\-\.@]+)"
-    ]
-    found_value = None
-    for pat in patterns:
-        m = re.search(pat, query, re.IGNORECASE)
-        if m:
-            found_value = m.group(1).strip()
-            break
-    if not found_value:
-        # Fallback: any word/phrase of 1+ char (letters, digits, spaces, dashes, underscores, dots)
-        m = re.search(r"([A-Za-z0-9][A-Za-z0-9 _\-\.@]*)", query)
-        if m:
-            found_value = m.group(1).strip()
-    if found_value:
-        results = recursive_fuzzy_value_search(found_value)
-        if not results:
-            return f"No records found for '{found_value}' in any file."
-        answers = []
-        for res in results:
-            answers.append(
-                f"**{res['matched_value']}** (in file `{res['file']}` | key: `{res['key']}` | path: `{'.'.join(res['match_path'])}`)"
-            )
-        return "\n\n".join(answers)
-    else:
-        return "No valid search value detected. Try a person's name, number, product, device, etc."
-# --- Streamlit UI setup ---
 if "json_data" not in st.session_state:
     st.session_state.json_data = {}
-if "messages" not in st.session_state:
-    st.session_state.messages = []
-if "temp_input" not in st.session_state:
-    st.session_state.temp_input = ""
-if "files_loaded" not in st.session_state:
-    st.session_state.files_loaded = False
-st.set_page_config(page_title="Flexible JSON Fuzzy Search", layout="wide")
-st.title("Instant JSON-Backed Q&A (Flexible Fuzzy Search — All Keys & Types!)")
 uploaded_files = st.sidebar.file_uploader(
     "Choose one or more JSON files", type="json", accept_multiple_files=True
 )
-if uploaded_files and not st.session_state.files_loaded:
     st.session_state.json_data.clear()
     for f in uploaded_files:
-        try:
-            content = json.load(f)
-            st.session_state.json_data[f.name] = content
-            st.sidebar.success(f"Loaded: {f.name}")
-        except Exception as e:
-            st.sidebar.error(f"Error reading {f.name}: {e}")
-    st.session_state.messages = []
-    st.session_state.files_loaded = True
-elif not uploaded_files:
-    st.session_state.json_data.clear()
-    st.session_state.files_loaded = False
-st.markdown("### Ask about ANY value (name, product, number, device, etc) — partials/typos/substring OK!")
-for msg in st.session_state.messages:
-    if msg["role"] == "user":
-        st.markdown(f"<div style='color: #4F8BF9;'><b>User:</b> {msg['content']}</div>", unsafe_allow_html=True)
-    else:
-        st.markdown(f"<div style='color: #1C6E4C;'><b>Agent:</b> {msg['content']}</div>", unsafe_allow_html=True)
-def send_message():
-    user_input = st.session_state.temp_input
-    if user_input.strip():
-        st.session_state.messages.append({"role": "user", "content": user_input})
-        answer = handle_user_query(user_input)
-        st.session_state.messages.append({"role": "assistant", "content": answer})
-        st.session_state.temp_input = ""
-if st.session_state.json_data:
-    st.text_input("Your message:", key="temp_input", on_change=send_message)
-    if st.button("Show all values in uploaded JSONs"):
-        st.write(show_all_strings())
 else:
-    st.info("Please upload at least one JSON file to start chatting.")

 import streamlit as st
 import json
+from langchain.chat_models import ChatOpenAI
+from langchain.agents import initialize_agent, Tool
 def normalize(s):
     return ' '.join(str(s).lower().replace("_", " ").replace("-", " ").replace(".", " ").split())
 def is_fuzzy_match(a, b, threshold=0.7):
+    from difflib import SequenceMatcher
+    ratio = SequenceMatcher(None, a, b).ratio()
     return ratio >= threshold or a in b or b in a
 def recursive_fuzzy_value_search(target_value):
         def _search(obj, path):
             if isinstance(obj, dict):
                 for k, v in obj.items():
                     if isinstance(v, (str, int, float, bool)) and is_fuzzy_match(norm_target, normalize(v)):
                         matches.append({
+                            "file": file_name,
                             "key": k,
+                            "path": ".".join(path + [k]),
+                            "value": v
                         })
                     _search(v, path + [k])
             elif isinstance(obj, list):
                 for idx, item in enumerate(obj):
         _search(data, [])
     return matches
+# LangChain Tool for LLM
+def json_search_tool(query: str) -> str:
+    """Search all uploaded JSON files for any value (fuzzy match); returns matching fields and values."""
+    results = recursive_fuzzy_value_search(query)
+    if not results:
+        return f"No match for '{query}'."
+    answer = []
+    for res in results:
+        answer.append(f"{res['file']} | {res['key']} ({res['path']}): {res['value']}")
+    return "\n".join(answer)
+# Streamlit UI
 if "json_data" not in st.session_state:
     st.session_state.json_data = {}
+if "chat_history" not in st.session_state:
+    st.session_state.chat_history = []
+st.set_page_config(page_title="Chat with Your JSONs!", layout="wide")
+st.title("Chat with Your JSON Files (powered by GPT + instant JSON search)")
 uploaded_files = st.sidebar.file_uploader(
     "Choose one or more JSON files", type="json", accept_multiple_files=True
 )
+if uploaded_files:
     st.session_state.json_data.clear()
     for f in uploaded_files:
+        content = json.load(f)
+        st.session_state.json_data[f.name] = content
+    st.sidebar.success("All JSON files loaded.")
+import os
+OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
+if not OPENAI_API_KEY:
+    st.warning("You must set your OPENAI_API_KEY for chat.")
 else:
+    llm = ChatOpenAI(model_name="gpt-4.1", openai_api_key=OPENAI_API_KEY)
+    tools = [
+        Tool(
+            name="json_search",
+            func=json_search_tool,
+            description="Find any value (name, product, number, etc) across all loaded JSON files. Input is what the user wants to find (e.g. 'iphone', 'apps installed', or 'alice')."
+        )
+    ]
+    agent = initialize_agent(
+        tools=tools,
+        llm=llm,
+        agent="chat-conversational-react-description",
+        verbose=False
+    )
+    for msg in st.session_state.chat_history:
+        if msg["role"] == "user":
+            st.markdown(f"<div style='color: #4F8BF9;'><b>User:</b> {msg['content']}</div>", unsafe_allow_html=True)
+        else:
+            st.markdown(f"<div style='color: #1C6E4C;'><b>Agent:</b> {msg['content']}</div>", unsafe_allow_html=True)
+    def send_chat():
+        user_input = st.session_state.temp_input
+        if user_input.strip():
+            st.session_state.chat_history.append({"role": "user", "content": user_input})
+            agent_reply = agent.run(user_input)
+            st.session_state.chat_history.append({"role": "assistant", "content": agent_reply})
+            st.session_state.temp_input = ""
+    if st.session_state.json_data:
+        st.text_input("Your message:", key="temp_input", on_change=send_chat)
+    else:
+        st.info("Please upload at least one JSON file to start chatting.")