Spaces:

melikakheirieh
/

nl2sql-copilot

Running

App Files Files Community

Melika Kheirieh committed 27 days ago

Commit

6f6e439

1 Parent(s): b432020

fix(planner): increase OpenAI timeout & add graceful timeout handling

Browse files

Files changed (2) hide show

adapters/llm/openai_provider.py +1 -1
nl2sql/planner.py +19 -1

adapters/llm/openai_provider.py CHANGED Viewed

@@ -48,7 +48,7 @@ class OpenAIProvider(LLMProvider):
         api_key, base_url, model = _resolve_api_config()
         os.environ["OPENAI_API_KEY"] = api_key
         os.environ["OPENAI_BASE_URL"] = base_url
-        self.client = OpenAI()
         self.model = model
         # last call usage/metadata for tracing
         self._last_usage: dict[str, Any] = {}

         api_key, base_url, model = _resolve_api_config()
         os.environ["OPENAI_API_KEY"] = api_key
         os.environ["OPENAI_BASE_URL"] = base_url
+        self.client = OpenAI(timeout=120.0)
         self.model = model
         # last call usage/metadata for tracing
         self._last_usage: dict[str, Any] = {}

nl2sql/planner.py CHANGED Viewed

@@ -86,6 +86,18 @@ def _pick_relevant_tables(schema_text: str, question: str, k: int = 3) -> str:
         return schema_text
 # ------------------------------ Planner ------------------------------
 class Planner:
     """Planner wrapper around the LLM provider."""
@@ -98,7 +110,10 @@ class Planner:
         self._plan_cache: dict[tuple[str, int, int], tuple[str, int, int, float]] = {}
     def run(self, *, user_query: str, schema_preview: str) -> Dict[str, Any]:
         trimmed = _pick_relevant_tables(schema_preview or "", user_query or "", k=3)
         key: tuple[str, int, int] = (
             self.model_id,
@@ -108,8 +123,11 @@ class Planner:
         if key in self._plan_cache:
             plan_text, pin, pout, cost = self._plan_cache[key]
         else:
             plan_text, pin, pout, cost = self.llm.plan(
-                user_query=user_query, schema_preview=trimmed
             )
             self._plan_cache[key] = (plan_text, pin, pout, cost)

         return schema_text
+# --------- Add schema size check ---------
def _trim_if_large(schema_text: str, max_chars: int = 8000) -> str:
    """Cap *schema_text* at ``max_chars`` characters, ending on a whole line.

    Text that already fits is returned unchanged. Otherwise only the first
    ``max_chars`` characters are considered, and a trailing line that was cut
    mid-way is dropped so the result ends on a complete line. Lines of a
    trimmed result are re-joined with a single newline character.

    Args:
        schema_text: Schema text to bound.
        max_chars: Maximum number of characters to keep. A value of zero or
            less leaves no budget, so oversized text trims to an empty string.

    Returns:
        ``schema_text`` itself when it fits; otherwise a prefix of it made of
        complete lines. If the very first line alone exceeds the budget, that
        line is returned truncated to ``max_chars`` characters.
    """
    if len(schema_text) <= max_chars:
        return schema_text
    # No budget at all: slicing would yield no lines (or, for a negative
    # budget, slice from the end), so return an empty result explicitly.
    if max_chars <= 0:
        return ""

    head = schema_text[:max_chars]
    lines = head.splitlines()
    # The last kept line is intact when the cut falls exactly on a line
    # break: either the head ends with one, or the next character is one.
    # The index is safe because len(schema_text) > max_chars here.
    cut_on_boundary = head.endswith(("\n", "\r")) or schema_text[max_chars] in "\n\r"
    if cut_on_boundary or len(lines) == 1:
        return "\n".join(lines)
    # Otherwise the final line was cut mid-way; drop the partial line.
    return "\n".join(lines[:-1])
 # ------------------------------ Planner ------------------------------
 class Planner:
     """Planner wrapper around the LLM provider."""
         self._plan_cache: dict[tuple[str, int, int], tuple[str, int, int, float]] = {}
     def run(self, *, user_query: str, schema_preview: str) -> Dict[str, Any]:
+        # First apply relevance filtering
         trimmed = _pick_relevant_tables(schema_preview or "", user_query or "", k=3)
+        # Then apply size limit to prevent timeout
+        trimmed = _trim_if_large(trimmed, max_chars=8000)
         key: tuple[str, int, int] = (
             self.model_id,
         if key in self._plan_cache:
             plan_text, pin, pout, cost = self._plan_cache[key]
         else:
+            # Call with increased timeout
             plan_text, pin, pout, cost = self.llm.plan(
+                user_query=user_query,
+                schema_preview=trimmed,
+                timeout=120,  # Increase timeout for large schemas
             )
             self._plan_cache[key] = (plan_text, pin, pout, cost)