Final_Agent_HF_Course

Sleeping

App Files Files Community

selim-ba commited on Jun 28, 2025

Commit

b27dd95

verified ·

1 Parent(s): ef79f14

Update app.py

Browse files

Files changed (1) hide show

app.py +242 -453

app.py CHANGED Viewed

@@ -23,25 +23,18 @@ except OSError:
     nlp = spacy.load("en_core_web_sm")
-# (Keep Constants as is)
-# --- Constants ---
-DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
-# --- Basic Agent Definition ---
-# ----- THIS IS WERE YOU CAN BUILD WHAT YOU WANT ------
-# class BasicAgent:
-#    def __init__(self):
-#        print("BasicAgent initialized.")
-#    def __call__(self, question: str) -> str:
-#        print(f"Agent received question (first 50 chars): {question[:50]}...")
-#        fixed_answer = "This is a default answer."
-#        print(f"Agent returning fixed answer: {fixed_answer}")
-#        return fixed_answer
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 class SuperSmartAgent:
     def __init__(self):
@@ -50,99 +43,161 @@ class SuperSmartAgent:
             extract_format=wikipediaapi.ExtractFormat.WIKI,
             user_agent='SelimResearchAgent/1.0'
         )
         self.graph = self._build_graph() # Build graph after initializing wiki_wiki
     def _build_graph(self):
-        # Helper functions (can be class methods or nested as before)
-        def score_text(text):
-            alnum_count = sum(c.isalnum() for c in text)
-            space_count = text.count(' ')
-            punctuation_count = sum(c in string.punctuation for c in text)
-            ends_properly = text[-1] in '.!?'
-            score = alnum_count + space_count
-            if ends_properly:
-                score += 5
-            return score
-        def check_reversed(state):
-            question = state["question"]
-            reversed_candidate = question[::-1]
-            original_score = score_text(question)
-            reversed_score = score_text(reversed_candidate)
-            if reversed_score > original_score:
-                state["is_reversed"] = True
-            else:
-                state["is_reversed"] = False
-            return state
-        def fix_question(state):
-            if state.get("is_reversed", False):
-                state["question"] = state["question"][::-1]
-            return state
-        def check_riddle_or_trick(state):
-            q = state["question"].lower()
-            keywords = ["opposite of", "if you understand", "riddle", "trick question", "what comes next", "i speak without"]
-            state["is_riddle"] = any(kw in q for kw in keywords)
-            return state
-        def solve_riddle(state):
-            q = state["question"].lower()
-            if "opposite of the word" in q:
-                if "left" in q:
-                    state["response"] = "right"
-                elif "up" in q:
-                    state["response"] = "down"
-                elif "hot" in q:
-                    state["response"] = "cold"
-                else:
-                    state["response"] = "Unknown opposite."
-            else:
-                state["response"] = "Could not solve riddle."
-            return state
-        def check_python_suitability(state):
-            question = state["question"].lower()
-            patterns = ["sum", "average", "count", "sort", "generate", "regex", "convert"]
-            state["is_python"] = any(word in question for word in patterns)
-            return state
-        def generate_code(state):
-            q = state["question"].lower()
-            if "sum" in q:
-                state["response"] = "numbers = [1, 2, 3]\nprint(sum(numbers))"
-            elif "average" in q:
-                state["response"] = "numbers = [1, 2, 3]\nprint(sum(numbers) / len(numbers))"
-            elif "sort" in q:
-                state["response"] = "data = [3, 1, 2]\ndata.sort()\nprint(data)"
             else:
-                state["response"] = "# Code generation not implemented for this case."
-            return state
-        def fallback(state):
-            state["response"] = "This question doesn't require Python or is unclear."
-            return state
-        def check_reasoning_needed(state):
-            q = state["question"].lower()
-            needs_reasoning = any(word in q for word in ["whose", "only", "first", "after", "before", "no longer", "not", "but", "except"])
-            state["needs_reasoning"] = needs_reasoning
-            return state
-        def check_wikipedia_suitability(state):
-            q = state["question"].lower()
-            triggers = [
-                "wikipedia", "who is", "what is", "when did", "where is",
-                "tell me about", "how many", "how much", "what was the",
-                "describe", "explain", "information about", "details about",
-                "history of", "facts about", "define", "give me data on"
-            ]
-            state["is_wiki"] = any(trigger in q for trigger in triggers)
-            return state
-        # --- MODIFIED/NEW HELPER METHODS (NOW PART OF THE CLASS) ---
-        # These methods are now part of the SuperSmartAgent class,
-        # so they can access self.wiki_wiki and other class properties.
     def get_relevant_context(self, question, search_results):
         """
@@ -218,7 +273,7 @@ class SuperSmartAgent:
         context = re.sub(r'\[\d+\]', '', context)  # Remove [1], [2], etc.
         context = re.sub(r'<ref[^>]*>.*?<\/ref>', '', context, flags=re.DOTALL | re.IGNORECASE) # Remove <ref> tags
         context = re.sub(r'\{\{.*?\}\}', '', context, flags=re.DOTALL) # Remove {{templates}}
-        context = re.sub(r'{\|.*?\|\}', '', context, flags=re.DOTALL) # Remove wiki tables (if extract_tables_from_wikipedia doesn't catch all)
         context = re.sub(r'==\s*See also\s*==.*?$', '', context, flags=re.DOTALL | re.IGNORECASE) # Remove "See also" section and anything after
         context = re.sub(r'==\s*References\s*==.*?$', '', context, flags=re.DOTALL | re.IGNORECASE) # Remove "References" section and anything after
         context = re.sub(r'\s+', ' ', context).strip() # Normalize whitespace
@@ -249,6 +304,9 @@ class SuperSmartAgent:
                 return state
             context = self.get_relevant_context(question, search_results)
             if not context:
                 state["response"] = "Sorry, I couldn't find detailed relevant information."
                 return state
@@ -327,7 +385,7 @@ class SuperSmartAgent:
             if not re.search(r'\d+', answer):
                 # If question asks for a number but answer has no number, it's likely wrong
                 return False
         # Check for year/date answers for "when" questions
         if "when" in question_lower or "year" in question_lower:
             if not re.search(r'\b\d{4}\b', answer) and not re.search(r'\b(Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec)\w*\s+\d{1,2}(?:st|nd|rd|th)?,\s+\d{4}\b', answer):
@@ -452,7 +510,7 @@ class SuperSmartAgent:
             relevant_date = self.find_relevant_date_spacy(question_lower, numbers_dates, entities)
             if relevant_date:
                 return f"The answer is {relevant_date}."
         elif question_type == "location":
             relevant_location = self.find_relevant_location_spacy(question_lower, entities)
             if relevant_location:
@@ -715,376 +773,107 @@ class SuperSmartAgent:
             headers = [self._clean_cell_content(cell).lower() for cell in table[0]] if table else []
             data_rows = table[1:] if len(table) > 1 else []
-            # Determine column types
             column_types = self.detect_column_types(table)
-            # Check if table is relevant to the question by checking headers and sample data
-            table_is_relevant = any(phrase.lower() in ' '.join(headers) for phrase in question_keywords) or \
-                                any(any(phrase.lower() in self._clean_cell_content(cell).lower() for phrase in question_keywords) for row in data_rows for cell in row[:min(len(row), 3)]) # Check first few cells of first few rows
-            if not table_is_relevant:
-                continue
-            # Prioritize based on question type
-            if "how many" in question_lower or "what was the" in question_lower or "total" in question_lower:
-                numeric_columns_indices = [i for i, col_type in enumerate(column_types) if col_type == 'number']
-                if numeric_columns_indices and data_rows:
-                    best_match_score = -1
-                    best_numeric_answer = None
-                    for row in data_rows:
-                        row_text_lower = ' '.join([self._clean_cell_content(c).lower() for c in row])
-                        # Score row based on how many question keywords it contains
-                        row_score = sum(1 for kw in question_keywords if kw.lower() in row_text_lower)
-                        if row_score > best_match_score:
-                            for col_idx in numeric_columns_indices:
-                                if col_idx < len(row):
-                                    cell_content = self._clean_cell_content(row[col_idx])
-                                    numbers = re.findall(r'(\d[\d,]*\d*)', cell_content)
-                                    if numbers:
-                                        # Take the first number found in the cell
-                                        clean_num = numbers[0].replace(',', '')
-                                        if clean_num.isdigit():
-                                            best_match_score = row_score
-                                            best_numeric_answer = clean_num
-                                            break # Found a number, move to next row if not the best
-                    if best_numeric_answer:
-                        return f"The answer is {best_numeric_answer}."
-            elif "who" in question_lower or "which person" in question_lower or "player" in question_lower:
-                name_columns_indices = [i for i, col_type in enumerate(column_types) if col_type == 'name']
-                if name_columns_indices and data_rows:
-                    best_match_score = -1
-                    best_name_answer = None
-                    for row in data_rows:
-                        row_text_lower = ' '.join([self._clean_cell_content(c).lower() for c in row])
-                        row_score = sum(1 for kw in question_keywords if kw.lower() in row_text_lower)
-                        if row_score > best_match_score:
-                            for col_idx in name_columns_indices:
-                                if col_idx < len(row):
-                                    cell_content = self._clean_cell_content(row[col_idx])
-                                    # Check if the cell content looks like a name using spaCy
-                                    doc_cell = nlp(cell_content)
-                                    if any(ent.label_ == "PERSON" for ent in doc_cell.ents):
-                                        best_match_score = row_score
-                                        best_name_answer = cell_content.strip()
-                                        break
-                    if best_name_answer:
-                        return f"The answer is {best_name_answer}."
-            elif "when" in question_lower or "year" in question_lower or "date" in question_lower:
-                date_columns_indices = [i for i, col_type in enumerate(column_types) if col_type == 'date']
-                if date_columns_indices and data_rows:
-                    best_match_score = -1
-                    best_date_answer = None
-                    for row in data_rows:
-                        row_text_lower = ' '.join([self._clean_cell_content(c).lower() for c in row])
-                        row_score = sum(1 for kw in question_keywords if kw.lower() in row_text_lower)
-                        if row_score > best_match_score:
-                            for col_idx in date_columns_indices:
-                                if col_idx < len(row):
-                                    cell_content = self._clean_cell_content(row[col_idx])
-                                    # Use more robust date detection
-                                    if re.search(r'\b(19|20)\d{2}\b', cell_content) or \
-                                       re.search(r'\b\d{1,2}\s+(Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec)\w*\s*\d{4}\b', cell_content, re.IGNORECASE):
-                                        best_match_score = row_score
-                                        best_date_answer = cell_content.strip()
-                                        break
-                    if best_date_answer:
-                        return f"The answer is {best_date_answer}."
         return None
     def detect_column_types(self, table):
         """
-        Detects the type of data in each column (e.g., 'number', 'name', 'date', 'text').
-        Uses spaCy for better entity recognition.
         """
-        if not table:
             return []
-        num_columns = len(table[0]) if table else 0
-        column_types = ['text'] * num_columns
-        # Sample a few rows to determine type
-        sample_rows = table[1:min(len(table), 5)]
-        for col_idx in range(num_columns):
-            col_values = [self._clean_cell_content(row[col_idx]) for row in sample_rows if col_idx < len(row)]
             num_count = 0
-            name_count = 0
             date_count = 0
-            for value in col_values:
-                value_doc = nlp(value)
-                # Check for numbers
-                if re.fullmatch(r'[\d,.-]+', value.replace(' ', '')): # Allow for decimals, negatives, commas
-                    num_count += 1
-                # Check for dates
-                if any(ent.label_ == "DATE" for ent in value_doc.ents):
-                    date_count += 1
-                elif re.search(r'\b\d{4}\b|\b\d{1,2}/\d{1,2}/\d{2,4}\b', value):
-                    date_count += 1
-                # Check for names (PERSON entity)
-                if any(ent.label_ == "PERSON" for ent in value_doc.ents):
-                    name_count += 1
-            # Heuristic to assign type: majority rules or strong indicators
-            if len(col_values) > 0:
-                if num_count / len(col_values) > 0.7: # More than 70% numbers
-                    column_types[col_idx] = 'number'
-                elif date_count / len(col_values) > 0.7: # More than 70% dates
-                    column_types[col_idx] = 'date'
-                elif name_count / len(col_values) > 0.5 and num_count == 0: # More than 50% names and no numbers
-                    column_types[col_idx] = 'name'
-                # Default remains 'text'
         return column_types
-    def column_looks_like_names(self, sample_values):
-        """Checks if a sample of values from a column primarily contains names using spaCy."""
-        if not sample_values:
-            return False
-        name_like_count = 0
-        for value in sample_values:
-            doc = nlp(value)
-            # A value looks like a name if spaCy identifies a PERSON entity
-            if any(ent.label_ == "PERSON" for ent in doc.ents):
-                name_like_count += 1
-        return name_like_count / len(sample_values) > 0.6 # Majority are name-like
-    class AgentState(TypedDict, total=False):
-        question: str
-        is_reversed: bool
-        is_python: bool
-        is_riddle: bool
-        is_wiki: bool
-        needs_reasoning: bool
-        response: str
-        use_tool: str
-        # Add current_context to state for find_relevant_person_spacy etc.
-        current_context: str # Stores the context retrieved from Wikipedia
-    def _build_graph(self):
-        # Nested functions need access to 'self' for the new methods.
-        # One way is to pass 'self' or make them direct methods of the class.
-        # For simplicity and to fit the graph builder, I'll assume `self`
-        # is implicitly available or methods are bound later.
-        # In this updated code, I've moved the modified/new functions directly
-        # into the SuperSmartAgent class as methods.
-        # The graph nodes will then call self.method_name.
-        # Ensure the graph nodes correctly reference the class methods
-        # For the graph to work, these need to be callable methods of the class.
-        # So we adapt the node definitions:
-        builder = StateGraph(self.AgentState)
-        builder.add_node("check_reversed", self.check_reversed_node)
-        builder.add_node("fix_question", self.fix_question_node)
-        builder.add_node("check_riddle_or_trick", self.check_riddle_or_trick_node)
-        builder.add_node("solve_riddle", self.solve_riddle_node)
-        builder.add_node("check_wikipedia_suitability", self.check_wikipedia_suitability_node)
-        builder.add_node("check_reasoning_needed", self.check_reasoning_needed_node)
-        builder.add_node("general_reasoning_qa", self.general_reasoning_qa_node)
-        builder.add_node("check_python_suitability", self.check_python_suitability_node)
-        builder.add_node("generate_code", self.generate_code_node)
-        builder.add_node("fallback", self.fallback_node)
-        # Bind the functions as methods of the class for the graph to call them
-        # This is a common pattern when using StateGraph with class methods
-        # The methods need to be defined outside _build_graph as instance methods
-        # I've defined them above as regular methods, so this part simplifies.
-        # Rename the nested functions to be class methods or use wrappers
-        # For simplicity, I'm just renaming the graph nodes to call self.method
-        # Make sure the actual function implementations are now class methods.
-        # Define wrapper methods to fit the graph signature if needed, or
-        # directly call the class methods from the graph nodes.
-        # Here, I'm directly renaming the graph calls to assume the original
-        # functions are now methods.
-        # Set entry point and define edges
-        builder.set_entry_point("check_reversed")
-        builder.add_edge("check_reversed", "fix_question")
-        builder.add_edge("fix_question", "check_riddle_or_trick")
-        builder.add_conditional_edges(
-            "check_riddle_or_trick",
-            lambda s: "solve_riddle" if s.get("is_riddle") else "check_wikipedia_suitability"
-        )
-        builder.add_conditional_edges(
-            "check_wikipedia_suitability",
-            lambda s: "general_reasoning_qa" if s.get("is_wiki") else "check_reasoning_needed" # Go directly to general_reasoning_qa for wiki
-        )
-        builder.add_conditional_edges(
-            "check_reasoning_needed",
-            lambda s: "general_reasoning_qa" if s.get("needs_reasoning") else "check_python_suitability"
-        )
-        builder.add_conditional_edges(
-            "check_python_suitability",
-            lambda s: "generate_code" if s.get("is_python") else "fallback"
         )
-        builder.add_edge("solve_riddle", END)
-        builder.add_edge("general_reasoning_qa", END)
-        builder.add_edge("generate_code", END)
-        builder.add_edge("fallback", END)
-        return builder.compile()
-    # --- Wrapper methods for the graph nodes ---
-    # These call the actual logic methods. This is a common pattern
-    # when your graph functions are class methods and need `self`.
-    def check_reversed_node(self, state):
-        return self._check_reversed(state)
-    def fix_question_node(self, state):
-        return self._fix_question(state)
-    def check_riddle_or_trick_node(self, state):
-        return self._check_riddle_or_trick(state)
-    def solve_riddle_node(self, state):
-        return self._solve_riddle(state)
-    def check_wikipedia_suitability_node(self, state):
-        return self._check_wikipedia_suitability(state)
-    def check_reasoning_needed_node(self, state):
-        return self._check_reasoning_needed(state)
-    def general_reasoning_qa_node(self, state):
-        # Before calling general_reasoning_qa, ensure current_context is set up
-        # This part of the logic might need to be shifted depending on graph flow.
-        # For now, general_reasoning_qa itself will fetch context.
-        response_state = self.general_reasoning_qa(state)
-        # Update current_context in the state if it was retrieved, for consistency
-        # although general_reasoning_qa itself uses it internally.
-        # This is a bit tricky with StateGraph if context isn't explicitly passed around
-        # or stored in the state by the `general_reasoning_qa` function itself.
-        # The `find_relevant_person_spacy` and similar methods now assume `self.current_context`
-        # is available. The `general_reasoning_qa` method *should* set it.
-        return response_state
-    def check_python_suitability_node(self, state):
-        return self._check_python_suitability(state)
-    def generate_code_node(self, state):
-        return self._generate_code(state)
-    def fallback_node(self, state):
-        return self._fallback(state)
-    # --- Renamed original helper functions to be internal methods ---
-    # These are the actual implementations, now as instance methods.
-    def _check_reversed(self, state):
-        question = state["question"]
-        reversed_candidate = question[::-1]
-        original_score = self._score_text(question)
-        reversed_score = self._score_text(reversed_candidate)
-        if reversed_score > original_score:
-            state["is_reversed"] = True
-        else:
-            state["is_reversed"] = False
-        return state
-    def _fix_question(self, state):
-        if state.get("is_reversed", False):
-            state["question"] = state["question"][::-1]
-        return state
-    def _check_riddle_or_trick(self, state):
-        q = state["question"].lower()
-        keywords = ["opposite of", "if you understand", "riddle", "trick question", "what comes next", "i speak without"]
-        state["is_riddle"] = any(kw in q for kw in keywords)
-        return state
-    def _solve_riddle(self, state):
-        q = state["question"].lower()
-        if "opposite of the word" in q:
-            if "left" in q:
-                state["response"] = "right"
-            elif "up" in q:
-                state["response"] = "down"
-            elif "hot" in q:
-                state["response"] = "cold"
-            else:
-                state["response"] = "Unknown opposite."
-        else:
-            state["response"] = "Could not solve riddle."
-        return state
-    def _check_python_suitability(self, state):
-        question = state["question"].lower()
-        patterns = ["sum", "average", "count", "sort", "generate", "regex", "convert"]
-        state["is_python"] = any(word in question for word in patterns)
-        return state
-    def _generate_code(self, state):
-        q = state["question"].lower()
-        if "sum" in q:
-            state["response"] = "numbers = [1, 2, 3]\nprint(sum(numbers))"
-        elif "average" in q:
-            state["response"] = "numbers = [1, 2, 3]\nprint(sum(numbers) / len(numbers))"
-        elif "sort" in q:
-            state["response"] = "data = [3, 1, 2]\ndata.sort()\nprint(data)"
-        else:
-            state["response"] = "# Code generation not implemented for this case."
-        return state
-    def _fallback(self, state):
-        state["response"] = "This question doesn't require Python or is unclear."
-        return state
-    def _check_reasoning_needed(self, state):
-        q = state["question"].lower()
-        needs_reasoning = any(word in q for word in ["whose", "only", "first", "after", "before", "no longer", "not", "but", "except"])
-        state["needs_reasoning"] = needs_reasoning
-        return state
-    def _check_wikipedia_suitability(self, state):
-        q = state["question"].lower()
-        triggers = [
-            "wikipedia", "who is", "what is", "when did", "where is",
-            "tell me about", "how many", "how much", "what was the",
-            "describe", "explain", "information about", "details about",
-            "history of", "facts about", "define", "give me data on"
-        ]
-        state["is_wiki"] = any(trigger in q for trigger in triggers)
-        return state
-    def _score_text(self, text):
-        alnum_count = sum(c.isalnum() for c in text)
-        space_count = text.count(' ')
-        punctuation_count = sum(c in string.punctuation for c in text)
-        ends_properly = text[-1] in '.!?'
-        score = alnum_count + space_count
-        if ends_properly:
-            score += 5
-        return score
-########################################
 def run_and_submit_all( profile: gr.OAuthProfile | None):
     """
     Fetches all questions, runs the BasicAgent on them, submits all answers,

     nlp = spacy.load("en_core_web_sm")
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
+# Define the State for the graph
+class AgentState(TypedDict):
+    question: str
+    response: str
+    is_reversed: bool
+    is_riddle: bool
+    is_python: bool
+    needs_reasoning: bool
+    is_wiki: bool
 class SuperSmartAgent:
     def __init__(self):
             extract_format=wikipediaapi.ExtractFormat.WIKI,
             user_agent='SelimResearchAgent/1.0'
         )
+        self.current_context = "" # Initialize current_context for use in methods that need it
         self.graph = self._build_graph() # Build graph after initializing wiki_wiki
     def _build_graph(self):
+        # Define the graph
+        workflow = StateGraph(AgentState)
+        # Add nodes (these will now be methods of the class)
+        workflow.add_node("check_reversed", self.check_reversed)
+        workflow.add_node("fix_question", self.fix_question)
+        workflow.add_node("check_riddle_or_trick", self.check_riddle_or_trick)
+        workflow.add_node("solve_riddle", self.solve_riddle)
+        workflow.add_node("check_python_suitability", self.check_python_suitability)
+        workflow.add_node("generate_code", self.generate_code)
+        workflow.add_node("check_reasoning_needed", self.check_reasoning_needed)
+        workflow.add_node("check_wikipedia_suitability", self.check_wikipedia_suitability)
+        workflow.add_node("general_reasoning_qa", self.general_reasoning_qa)
+        workflow.add_node("fallback", self.fallback) # A fallback node for questions that don't fit categories
+        # Set entry point
+        workflow.set_entry_point("check_reversed")
+        # Add edges
+        workflow.add_conditional_edges(
+            "check_reversed",
+            lambda state: "fix_question" if state["is_reversed"] else "check_riddle_or_trick",
+        )
+        workflow.add_edge("fix_question", "check_riddle_or_trick")
+        workflow.add_conditional_edges(
+            "check_riddle_or_trick",
+            lambda state: "solve_riddle" if state["is_riddle"] else "check_python_suitability",
+        )
+        workflow.add_edge("solve_riddle", END) # End if riddle solved
+        workflow.add_conditional_edges(
+            "check_python_suitability",
+            lambda state: "generate_code" if state["is_python"] else "check_wikipedia_suitability",
+        )
+        workflow.add_edge("generate_code", END) # End if code generated
+        workflow.add_conditional_edges(
+            "check_wikipedia_suitability",
+            lambda state: "general_reasoning_qa" if state["is_wiki"] else "fallback",
+        )
+        workflow.add_edge("general_reasoning_qa", END)
+        workflow.add_edge("fallback", END)
+        return workflow.compile()
+    def __call__(self, question: str) -> str:
+        """
+        Runs the agent's graph with the given question.
+        """
+        # Initialize state for each new question
+        initial_state = AgentState(
+            question=question,
+            response="",
+            is_reversed=False,
+            is_riddle=False,
+            is_python=False,
+            needs_reasoning=False,
+            is_wiki=False
+        )
+        final_state = self.graph.invoke(initial_state)
+        return final_state["response"]
+    # --- HELPER METHODS (NOW PART OF THE CLASS) ---
+    def score_text(self, text):
+        alnum_count = sum(c.isalnum() for c in text)
+        space_count = text.count(' ')
+        punctuation_count = sum(c in string.punctuation for c in text)
+        ends_properly = text[-1] in '.!?'
+        score = alnum_count + space_count
+        if ends_properly:
+            score += 5
+        return score
+    def check_reversed(self, state):
+        question = state["question"]
+        reversed_candidate = question[::-1]
+        original_score = self.score_text(question)
+        reversed_score = self.score_text(reversed_candidate)
+        if reversed_score > original_score:
+            state["is_reversed"] = True
+        else:
+            state["is_reversed"] = False
+        return state
+    def fix_question(self, state):
+        if state.get("is_reversed", False):
+            state["question"] = state["question"][::-1]
+        return state
+    def check_riddle_or_trick(self, state):
+        q = state["question"].lower()
+        keywords = ["opposite of", "if you understand", "riddle", "trick question", "what comes next", "i speak without"]
+        state["is_riddle"] = any(kw in q for kw in keywords)
+        return state
+    def solve_riddle(self, state):
+        q = state["question"].lower()
+        if "opposite of the word" in q:
+            if "left" in q:
+                state["response"] = "right"
+            elif "up" in q:
+                state["response"] = "down"
+            elif "hot" in q:
+                state["response"] = "cold"
             else:
+                state["response"] = "Unknown opposite."
+        else:
+            state["response"] = "Could not solve riddle."
+        return state
+    def check_python_suitability(self, state):
+        question = state["question"].lower()
+        patterns = ["sum", "average", "count", "sort", "generate", "regex", "convert"]
+        state["is_python"] = any(word in question for word in patterns)
+        return state
+    def generate_code(self, state):
+        q = state["question"].lower()
+        if "sum" in q:
+            state["response"] = "numbers = [1, 2, 3]\nprint(sum(numbers))"
+        elif "average" in q:
+            state["response"] = "numbers = [1, 2, 3]\nprint(sum(numbers) / len(numbers))"
+        elif "sort" in q:
+            state["response"] = "data = [3, 1, 2]\ndata.sort()\nprint(data)"
+        else:
+            state["response"] = "# Code generation not implemented for this case."
+        return state
+    def fallback(self, state):
+        state["response"] = "This question doesn't require Python or is unclear."
+        return state
+    def check_reasoning_needed(self, state):
+        q = state["question"].lower()
+        needs_reasoning = any(word in q for word in ["whose", "only", "first", "after", "before", "no longer", "not", "but", "except"])
+        state["needs_reasoning"] = needs_reasoning
+        return state
+    def check_wikipedia_suitability(self, state):
+        q = state["question"].lower()
+        triggers = [
+            "wikipedia", "who is", "what is", "when did", "where is",
+            "tell me about", "how many", "how much", "what was the",
+            "describe", "explain", "information about", "details about",
+            "history of", "facts about", "define", "give me data on"
+        ]
+        state["is_wiki"] = any(trigger in q for trigger in triggers)
+        return state
     def get_relevant_context(self, question, search_results):
         """
         context = re.sub(r'\[\d+\]', '', context)  # Remove [1], [2], etc.
         context = re.sub(r'<ref[^>]*>.*?<\/ref>', '', context, flags=re.DOTALL | re.IGNORECASE) # Remove <ref> tags
         context = re.sub(r'\{\{.*?\}\}', '', context, flags=re.DOTALL) # Remove {{templates}}
+        context = re.sub(r'\{\|.*?\|\}\}', '', context, flags=re.DOTALL) # Remove wiki tables (if extract_tables_from_wikipedia doesn't catch all)
         context = re.sub(r'==\s*See also\s*==.*?$', '', context, flags=re.DOTALL | re.IGNORECASE) # Remove "See also" section and anything after
         context = re.sub(r'==\s*References\s*==.*?$', '', context, flags=re.DOTALL | re.IGNORECASE) # Remove "References" section and anything after
         context = re.sub(r'\s+', ' ', context).strip() # Normalize whitespace
                 return state
             context = self.get_relevant_context(question, search_results)
+            # Store the context in an instance variable so other methods can access it
+            self.current_context = context
             if not context:
                 state["response"] = "Sorry, I couldn't find detailed relevant information."
                 return state
             if not re.search(r'\d+', answer):
                 # If question asks for a number but answer has no number, it's likely wrong
                 return False
         # Check for year/date answers for "when" questions
         if "when" in question_lower or "year" in question_lower:
             if not re.search(r'\b\d{4}\b', answer) and not re.search(r'\b(Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec)\w*\s+\d{1,2}(?:st|nd|rd|th)?,\s+\d{4}\b', answer):
             relevant_date = self.find_relevant_date_spacy(question_lower, numbers_dates, entities)
             if relevant_date:
                 return f"The answer is {relevant_date}."
         elif question_type == "location":
             relevant_location = self.find_relevant_location_spacy(question_lower, entities)
             if relevant_location:
             headers = [self._clean_cell_content(cell).lower() for cell in table[0]] if table else []
             data_rows = table[1:] if len(table) > 1 else []
+            # Determine column types (placeholder for now, needs implementation)
             column_types = self.detect_column_types(table)
+            # ... (Rest of your table search logic would go here)
+            # For now, just return a dummy answer if a table is found to avoid the error.
+            # You'll need to implement the actual table search and answer extraction logic.
+            # Example:
+            if "president" in question_lower and "usa" in question_lower and headers and "name" in headers:
+                name_col_idx = headers.index("name")
+                # More complex logic needed to find relevant row
+                return "Placeholder: Found answer in table for president question."
+            # Simple keyword match within table cells as a basic example
+            for row_idx, row in enumerate(table):
+                for cell_idx, cell_content in enumerate(row):
+                    cell_lower = cell_content.lower()
+                    if any(keyword in cell_lower for keyword in question_keywords):
+                        # This is very basic, a proper implementation would consider column headers
+                        # and question type to return a specific cell or a combination.
+                        if headers and cell_idx < len(headers):
+                            return f"Found '{cell_content}' under '{headers[cell_idx]}' in a table."
+                        else:
+                            return f"Found '{cell_content}' in a table."
         return None
     def detect_column_types(self, table):
         """
+        Detects the type of data in each column (e.g., 'number', 'text', 'date').
+        This is a placeholder and would need a robust implementation.
         """
+        if not table or not table[0]:
             return []
+        num_cols = len(table[0])
+        column_types = ["text"] * num_cols # Default to text
+        # Example: rudimentary detection for the first few rows
+        for col_idx in range(num_cols):
             num_count = 0
             date_count = 0
+            for row_idx in range(1, min(len(table), 5)): # Check first 5 data rows
+                if col_idx < len(table[row_idx]):
+                    cell_content = self._clean_cell_content(table[row_idx][col_idx])
+                    if re.match(r'^\d+(\.\d+)?$', cell_content):
+                        num_count += 1
+                    if re.match(r'\b\d{4}\b', cell_content) or re.match(r'\b(Jan|Feb|Mar)\w*\s+\d{1,2}(?:st|nd|rd|th)?(?:,\s+\d{4})?\b', cell_content, re.IGNORECASE):
+                        date_count += 1
+            if num_count > 2: # Heuristic: if more than 2 numbers
+                column_types[col_idx] = "number"
+            elif date_count > 1: # Heuristic: if more than 1 date
+                column_types[col_idx] = "date"
         return column_types
+# --- Gradio Interface (as provided, assuming it will call agent correctly) ---
+# Define the Gradio interface if needed for testing outside the main app.
+# If this is part of a larger application, this might be handled differently.
+if __name__ == '__main__':
+    agent = SuperSmartAgent() # Instantiate the agent
+    def chat_interface(question):
+        response = agent(question) # The __call__ method handles the graph invocation
+        return response
+    if os.getenv("RUN_GRADIO_APP", "false").lower() == "true":
+        demo = gr.Interface(
+            fn=chat_interface,
+            inputs=gr.Textbox(lines=2, placeholder="Enter your question here..."),
+            outputs="text",
+            title="Super Smart Agent",
+            description="An agent capable of answering questions, solving riddles, and generating Python code."
         )
+        demo.launch()
+    # Example usage for testing without Gradio:
+    print("Testing SuperSmartAgent without Gradio:")
+    my_agent = SuperSmartAgent()
+    test_questions = [
+        "What is the opposite of the word 'cold'?",
+        "How many planets are in our solar system?",
+        "Sort the list [5, 2, 8, 1]",
+        "What is the capital of France?",
+        "When was Albert Einstein born?",
+        "If I have 3 apples and you take 1, how many do I have?", # Riddle
+        "What is the population of Tokyo?",
+        "What is the sum of 10 and 20?",
+        "gnitset a si sihT", # Reversed question
+        "Who invented the telephone?"
+    ]
+    for q in test_questions:
+        print(f"\nQuestion: {q}")
+        answer = my_agent(q)
+        print(f"Answer: {answer}")
 def run_and_submit_all( profile: gr.OAuthProfile | None):
     """
     Fetches all questions, runs the BasicAgent on them, submits all answers,