Spaces:

Nexari-Research
/

Nexari-Server

Sleeping

App Files Community

Nexari-Research committed on Dec 3, 2025

Commit

98e4c13

verified ·

1 Parent(s): cda338b

Update tools_engine.py

Browse files

Files changed (1) hide show

tools_engine.py +29 -38

tools_engine.py CHANGED Viewed

@@ -1,26 +1,24 @@
 """
-tools_engine.py - Improved perform_web_search to return structured results.
 """
 from duckduckgo_search import DDGS
 from transformers import pipeline
 import re
-import logging
-logger = logging.getLogger("nexari-tools")
 print(">>> Tools: Loading Intent Classification Model...")
-# Use a lighter model or the one you had.
 intent_classifier = pipeline("zero-shot-classification", model="typeform/distilbert-base-uncased-mnli")
 def analyze_intent(user_text):
     if not user_text:
         return "general"
     text_lower = user_text.lower().strip()
-    # Direct triggers
-    direct_chat_triggers = ["hi","hello","hey","hlo","namaste","who are you"]
-    if text_lower in direct_chat_triggers:
         return "general"
     candidate_labels = ["internet search","general conversation","coding request","checking time"]
@@ -28,55 +26,48 @@ def analyze_intent(user_text):
         result = intent_classifier(user_text, candidate_labels)
         top_label = result['labels'][0]
         confidence = result['scores'][0]
         mapping = {
             "internet search": "internet_search",
             "general conversation": "general",
             "coding request": "coding_request",
             "checking time": "checking_time"
         }
-        # Threshold
         if confidence > 0.45:
             return mapping.get(top_label, "general")
-    except Exception as e:
-        logger.error(f"Intent Error: {e}")
     return "general"
 def perform_web_search(user_text, max_results=4):
     """
-    Returns structured dict: { "query": str, "results": [ {title, snippet, url} ] }
     """
     try:
-        # cleanup query
         query = user_text
-        remove_phrases = ["search for","find","google","lookup","what is","tell me about"]
-        q_lower = query.lower()
         for p in remove_phrases:
-            if q_lower.startswith(p):
-                query = query[len(p):].strip()
-        logger.info(f"Searching web for: {query}")
-        # DDGS execution
-        results_list = []
-        with DDGS() as ddgs:
-            # .text() returns an iterator
-            ddgs_gen = ddgs.text(query, max_results=max_results)
-            if ddgs_gen:
-                results_list = list(ddgs_gen)
-        structured = {"query": query, "results": []}
-        for r in results_list:
             title = r.get("title","").strip()
             body = re.sub(r'\s+',' ', r.get("body","").strip())
-            url = r.get("href") or r.get("url") or ""
-            snippet = body[:300] + "..." if len(body) > 300 else body
             structured["results"].append({"title": title, "snippet": snippet, "url": url})
         return structured
     except Exception as e:
-        logger.error(f"Search failed: {e}")
         return {"query": user_text, "results": []}

 """
+tools_engine.py - Improved perform_web_search to return structured results with URLs and snippets,
+and canonical intent detection unchanged.
 """
 from duckduckgo_search import DDGS
 from transformers import pipeline
 import re
 print(">>> Tools: Loading Intent Classification Model...")
 intent_classifier = pipeline("zero-shot-classification", model="typeform/distilbert-base-uncased-mnli")
 def analyze_intent(user_text):
     if not user_text:
         return "general"
     text_lower = user_text.lower().strip()
+    direct_chat_triggers = [
+        "hi","hello","hey","hlo","namaste",
+        "what is your name", "who are you", "your name"
+    ]
+    if text_lower in direct_chat_triggers or any(text_lower.startswith(t + " ") for t in direct_chat_triggers):
         return "general"
     candidate_labels = ["internet search","general conversation","coding request","checking time"]
         result = intent_classifier(user_text, candidate_labels)
         top_label = result['labels'][0]
         confidence = result['scores'][0]
         mapping = {
             "internet search": "internet_search",
             "general conversation": "general",
             "coding request": "coding_request",
             "checking time": "checking_time"
         }
         if confidence > 0.45:
             return mapping.get(top_label, "general")
+    except Exception:
+        pass
     return "general"
 def perform_web_search(user_text, max_results=4):
     """
+    Return structured results:
+    {
+      "query": "...",
+      "results": [
+         {"title": "...", "snippet": "...", "url": "..."},
+         ...
+      ]
+    }
     """
     try:
         query = user_text
+        # sanitize small verbs
+        remove_phrases = ["search for","find","google","look up","lookup","what is","tell me"]
+        q = query.lower()
         for p in remove_phrases:
+            q = q.replace(p, "")
+        q = q.strip() or query
+        results = list(DDGS().text(q, max_results=max_results))
+        structured = {"query": q, "results": []}
+        for r in results:
             title = r.get("title","").strip()
             body = re.sub(r'\s+',' ', r.get("body","").strip())
+            url = r.get("href") or r.get("url") or r.get("link") or ""
+            # short snippet
+            snippet = body[:320]
             structured["results"].append({"title": title, "snippet": snippet, "url": url})
         return structured
     except Exception as e:
+        print(f"Search error: {e}")
         return {"query": user_text, "results": []}