Spaces:

davidtran999
/

hue-portal-backendDocker

Running

App Files Files Community

davidtran999 committed on 17 days ago

Commit

03445af

verified ·

1 Parent(s): f8e149d

Upload backend/hue_portal/chatbot/router.py with huggingface_hub

Browse files

Files changed (1) hide show

backend/hue_portal/chatbot/router.py +45 -0

backend/hue_portal/chatbot/router.py CHANGED Viewed

@@ -8,6 +8,8 @@ from dataclasses import dataclass, field
 from enum import Enum
 from typing import Dict, Optional
 class IntentRoute(str, Enum):
     """High-level route for the chatbot pipeline."""
@@ -62,8 +64,17 @@ def _flag_keywords(query_lower: str) -> Dict[str, bool]:
             kw in query_lower
             for kw in [
                 "quyết định",
                 "thông tư",
                 "nghị quyết",
                 "kỷ luật",
                 "qd 69",
                 "qd 264",
@@ -84,6 +95,8 @@ class RouteDecision:
     rationale: str
     forced_intent: Optional[str] = None
     keyword_flags: Dict[str, bool] = field(default_factory=dict)
 def decide_route(query: str, intent: str, confidence: float) -> RouteDecision:
@@ -94,6 +107,7 @@ def decide_route(query: str, intent: str, confidence: float) -> RouteDecision:
     words = query_lower.split()
     keyword_flags = _flag_keywords(query_lower)
     has_doc_code = _has_document_code(query_lower)
     route = IntentRoute.SEARCH
     rationale = "default-search"
@@ -145,6 +159,19 @@ def decide_route(query: str, intent: str, confidence: float) -> RouteDecision:
                 rationale = f"keyword-override-{flag}"
                 break
     return RouteDecision(
         route=route,
         intent=intent,
@@ -152,5 +179,23 @@ def decide_route(query: str, intent: str, confidence: float) -> RouteDecision:
         rationale=rationale,
         forced_intent=forced_intent,
         keyword_flags=keyword_flags,
     )

 from enum import Enum
 from typing import Dict, Optional
+from hue_portal.chatbot.document_topics import DOCUMENT_TOPICS
 class IntentRoute(str, Enum):
     """High-level route for the chatbot pipeline."""
             kw in query_lower
             for kw in [
                 "quyết định",
+                "quyet dinh",
                 "thông tư",
+                "thong tu",
                 "nghị quyết",
+                "nghi quyet",
+                "nghị định",
+                "nghi dinh",
+                "luật",
+                "luat",
+                "điều ",
+                "dieu ",
                 "kỷ luật",
                 "qd 69",
                 "qd 264",
     rationale: str
     forced_intent: Optional[str] = None
     keyword_flags: Dict[str, bool] = field(default_factory=dict)
+    clarification_required: bool = False
+    topic_scores: Dict[str, float] = field(default_factory=dict)
 def decide_route(query: str, intent: str, confidence: float) -> RouteDecision:
     words = query_lower.split()
     keyword_flags = _flag_keywords(query_lower)
     has_doc_code = _has_document_code(query_lower)
+    topic_scores = _compute_topic_scores(query_lower)
     route = IntentRoute.SEARCH
     rationale = "default-search"
                 rationale = f"keyword-override-{flag}"
                 break
+    clarification_required = False
+    should_consider_legal = (
+        (forced_intent == "search_legal") or (intent == "search_legal") or keyword_flags["legal"]
+    )
+    if (
+        route == IntentRoute.SEARCH
+        and should_consider_legal
+        and not has_doc_code
+        and not forced_intent == "greeting"
+    ):
+        if topic_scores or confidence < 0.5:
+            clarification_required = True
     return RouteDecision(
         route=route,
         intent=intent,
         rationale=rationale,
         forced_intent=forced_intent,
         keyword_flags=keyword_flags,
+        clarification_required=clarification_required,
+        topic_scores=topic_scores,
     )
+def _compute_topic_scores(query_lower: str) -> Dict[str, float]:
+    scores: Dict[str, float] = {}
+    for topic in DOCUMENT_TOPICS:
+        keywords = topic.get("keywords", [])
+        score = 0.0
+        for keyword in keywords:
+            normalized_kw = keyword.lower()
+            if not normalized_kw:
+                continue
+            if normalized_kw in query_lower:
+                score += 1.5 if len(normalized_kw) > 5 else 1.0
+        if score > 0:
+            scores[topic["code"].upper()] = score
+    return scores