Spaces:

nat232
/

student_sample_panel

Build error

App Files Community

scormon-predata-ai committed on Jun 25, 2025

Commit

0bd36cc

verified ·

1 Parent(s): b75c907

Update researchsimulation/InteractiveInterviewChatbot.py

Browse files

Files changed (1) hide show

researchsimulation/InteractiveInterviewChatbot.py +130 -87

researchsimulation/InteractiveInterviewChatbot.py CHANGED Viewed

@@ -43,7 +43,6 @@ def parse_question_with_llm(question, respondent_names, processor_llm):
            - **Correct (British):** organised, prioritise, minimise, realise, behaviour, centre, defence, travelling, practise (verb), licence (noun), programme, aeroplane.
            - **Incorrect (American):** organized, prioritize, minimize, realize, behavior, center, defense, traveling, practice (verb and noun), license (noun), program, airplane.
     6. Ensure that you follow the **Formatting Rules** exactly. THIS IS EXTREMELY IMPORTANT.
     ### Examples:
     - "Sourav, do you agree with this topic?" → "Do you agree with this topic?"
     - "What do you think about this topic, Divya?" → "What do you think about this topic?"
@@ -55,7 +54,6 @@ def parse_question_with_llm(question, respondent_names, processor_llm):
     - "Divya, what did you learn from this program?" → "What did you learn from this programme?"
     - "How do you stay organized, Rahul?" → "How do you stay organised?"
     - "Meena, how do you balance work and traveling?" → "How do you balance work and travelling?"
     ### **Formatting Rules**:
     For each question identified, respond using **only** the following format:
     - Respondent: <Respondent Name>
@@ -206,100 +204,85 @@ def validate_question_topics(parsed_questions, processor_llm):
-def generate_generic_answer(agent_name, agent_question, respondent_agent):
-    """
-    Generate a raw, generic answer in first person, British English, without applying any specific style or tone.
-    """
-    task_prompt = f"""
-You are {agent_name}. Respond to the question below **in first person**, using British English.
-Focus only on answering naturally and authentically. Do not apply any specific tone or style.
-### Question:
-"{agent_question}"
-"""
-    raw_response_task = Task(description=task_prompt, expected_output="", agent=respondent_agent)
-    crew = Crew(agents=[respondent_agent], tasks=[raw_response_task], process=Process.sequential)
-    crew.kickoff()
-    return raw_response_task.output.raw.strip()
-def stylise_answer(raw_response, communication_style, agent_name, processor_llm):
     """
-    Rephrase the answer to match the respondent's style and tone, using British English.
     """
-    style_prompt = f"""
-Rephrase the following response into a {communication_style} tone using British English.
-Keep it in first person and do not change the meaning.
-### Original Response:
-"{raw_response}"
-"""
-    return processor_llm.invoke(style_prompt).content.strip()
-def validate_final_answer(answer, agent_name):
-    """
-    Validate the final answer. Returns a formatted string or an error message if invalid.
-    """
-    if not answer:
-        return f"**{agent_name}**: I wasn't able to answer right now – can you try again?"
-    return f"**{agent_name}**: {answer}"
-def run_interview_pipeline(respondent_agents_dict, last_active_agent, question, processor_llm):
-    logging.info(f"Received question: {question}")
     agent_names = list(respondent_agents_dict.keys())
     # Step 1: Parse question
     parsed_questions = parse_question_with_llm(question, str(agent_names), processor_llm)
     if not parsed_questions:
         return ["**PreData Moderator**: No valid respondents were detected for this question."]
-    # Step 2: Validate parsed questions
     validated_questions = validate_question_topics(parsed_questions, processor_llm)
-    for resp, q in validated_questions.items():
-        if q == "INVALID":
             return ["**PreData Moderator**: The question is invalid. Please ask another question."]
-    parsed_questions = validated_questions
-    # Handle multiple respondents
     if len(parsed_questions) > 1:
-        return ["**PreData Moderator**: Please ask each respondent one question at a time."]
-    # Handle "General" or "All"
-    # [Insert logic here – reuse your existing handling of General/All]
     last_active_agent = list(parsed_questions.keys())
-    responses = []
-    # === MAIN LOOP ===
     for agent_name, agent_question in parsed_questions.items():
-        agent_entry = respondent_agents_dict.get(agent_name)
-        if not agent_entry:
             responses.append(f"**PreData Moderator**: {agent_name} is not a valid respondent.")
             continue
-        respondent_agent = agent_entry.get_agent()
-        user_profile = agent_entry.get_user_profile()
-        #        communication_style = user_profile.get_field("Communication", "Style")
         communication_style = ""
         question_task_description = f"""
 You are {agent_name}. You are responding to a market research interview question. Your response must strictly follow the *style and tone* and *Hard Rules – You Must Follow These Without Exception* outlined below.
 ---
@@ -324,7 +307,7 @@ You are {agent_name}. You are responding to a market research interview question
         -Example:
             Q: Where are you from?
             A: I’m from [city], [country](DO NOT ADD ANY EXTRA COMMENTS).
-    -For reflective or opinion-based questions (e.g., feelings, preferences, motivations), provide thoughtful but still clear and focused answers.
     -Never repeat the question or add unrelated background information.
 ---
 ### **How to Answer:**
@@ -333,8 +316,8 @@ You are {agent_name}. You are responding to a market research interview question
 - Adapt your **sentence structure, phrasing, and word choices** to match the intended communication style.
 - If applicable, incorporate **culturally relevant expressions, regional nuances, or industry-specific terminology** that fit the given tone.
 - **Adjust response length** based on the tone—**concise and direct** for casual styles, **structured and detailed** for professional styles.
-- **Always answer in first person (\"I\", \"my\", \"me\", \"mine\", etc.) as if you are personally responding to the question. You are an individual representing yourself, not speaking in third person.**
-    -Always answer as if you are the individual being directly spoken to. Use first-person language such as “I,” “me,” “my,” and “mine” in every response. Imagine you are having a real conversation — your tone should feel natural, personal, and authentic. Do not refer to yourself in the third person (e.g., “She is from Trichy” or “Meena likes…”). Avoid describing yourself as if someone else is talking about you.
     -Everything you say should come from your own perspective, just like you would in everyday speech. The goal is to sound human, relatable, and direct — like you're truly present in the conversation.
 ---
 ### **Guidelines for Ensuring Authenticity & Alignment:**
@@ -354,7 +337,7 @@ You are {agent_name}. You are responding to a market research interview question
   - If the tone is formal, use a structured and professional format.
 - **Do not include emojis or hashtags in the response.**
 - Maintain **narrative and thematic consistency** across all answers to simulate a coherent personality.
--**Personality Profile Alignment:
     -Consider your assigned personality traits across these dimensions:
         -Big Five Traits:
             -Openness: Reflect your level of curiosity, creativity, and openness to new experiences
@@ -387,24 +370,84 @@ Your final answer should be **a well-structured response that directly answers t
 **"{agent_question}"**
         """
         question_task_expected_output = f"""
 A culturally authentic and conversational response to the question: '{agent_question}'.
 - The response must reflect the respondent's **local cultural background and geographic influences**, ensuring it aligns with their **speech patterns, preferences, and linguistic style**.
-- The language must follow **strict British English spelling conventions**, ensuring it is **natural, personal, and free-flowing**, while strictly avoiding American spelling, phrasing, or grammar under any circumstances, regardless of the spelling, grammar, or vocabulary used in the input question.
 - The response **must not introduce the respondent**, nor include placeholders like "[Your Name]" or "[Brand Name]".
-- The response **must always be written in first person (\"I\", \"my\", \"me\", etc.) as if the respondent is personally answering the question directly. Third-person narration is never allowed.**
 - The final output should be a **single, well-structured paragraph that directly answers the question** while staying fully aligned with the specified communication style.
         """
-        # Step 1: Generate generic answer
-        raw_response = generate_generic_answer(agent_name, agent_question, respondent_agent)
-        # Step 2: Stylise answer
-        styled_response = stylise_answer(raw_response, communication_style, agent_name, processor_llm)
-        # Step 3: Validate answer
-        formatted_response = validate_final_answer(styled_response, agent_name)
-        responses.append(formatted_response)
-    return responses

            - **Correct (British):** organised, prioritise, minimise, realise, behaviour, centre, defence, travelling, practise (verb), licence (noun), programme, aeroplane.
            - **Incorrect (American):** organized, prioritize, minimize, realize, behavior, center, defense, traveling, practice (verb and noun), license (noun), program, airplane.
     6. Ensure that you follow the **Formatting Rules** exactly. THIS IS EXTREMELY IMPORTANT.
     ### Examples:
     - "Sourav, do you agree with this topic?" → "Do you agree with this topic?"
     - "What do you think about this topic, Divya?" → "What do you think about this topic?"
     - "Divya, what did you learn from this program?" → "What did you learn from this programme?"
     - "How do you stay organized, Rahul?" → "How do you stay organised?"
     - "Meena, how do you balance work and traveling?" → "How do you balance work and travelling?"
     ### **Formatting Rules**:
     For each question identified, respond using **only** the following format:
     - Respondent: <Respondent Name>
+def ask_interview_question(respondent_agents_dict, last_active_agent, question, processor_llm):
     """
+    Handles both individual and group interview questions while tracking conversation flow.
+    Uses OpenAI's LLM to extract the intended respondent(s) and their specific question(s).
+    Uses Groq's LLM for response generation.
     """
+    logging.info(f"START: Processing new interview question: {question}")
+    responses = []
     agent_names = list(respondent_agents_dict.keys())
+    logging.info(f"Available respondents: {agent_names}")
+    print(f"Available respondents: {agent_names}")
+    # Use OpenAI LLM to parse questions into individual respondent-specific sub-questions and validate them
     # Step 1: Parse question
+    logging.info("STEP 1: Parsing question with LLM...")
     parsed_questions = parse_question_with_llm(question, str(agent_names), processor_llm)
+    logging.info(f"Parsed Questions Output: {parsed_questions}")
     if not parsed_questions:
+        logging.warning("No questions were parsed from input.")
         return ["**PreData Moderator**: No valid respondents were detected for this question."]
+    # Step 2: Validate question content (scope + spelling)
+    logging.info("STEP 2: Validating questions for topic relevance and British English...")
     validated_questions = validate_question_topics(parsed_questions, processor_llm)
+    logging.info(f"Validated Questions: {validated_questions}")
+    for resp_name, extracted_question in validated_questions.items():
+        if extracted_question == "INVALID":
+            logging.warning(f"Invalid question detected for {resp_name}: {extracted_question}")
             return ["**PreData Moderator**: The question is invalid. Please ask another question."]
+    # Use validated questions from this point on
+    parsed_questions = validated_questions
+    logging.info(f"Validated questions: {parsed_questions}")
     if len(parsed_questions) > 1:
+        logging.warning("More than one respondent specified. Exiting function.")
+        return "**PreData Moderator**: Please ask each respondent one question at a time."
+    else:
+        print(f"Parsed questions are: {parsed_questions}")
+    if "General" in parsed_questions:
+        if "General" in parsed_questions:
+            if isinstance(last_active_agent, list) and all(name in agent_names for name in last_active_agent):
+                logging.info(f"General case detected. Continuing with last active agent: {last_active_agent}")
+                parsed_questions = {name: parsed_questions["General"] for name in last_active_agent}
+            else:
+                logging.info("General case detected without a valid previous active agent. Assigning question to all respondents.")
+                parsed_questions = {name: parsed_questions["General"] for name in agent_names}
+    elif "All" in parsed_questions:
+        logging.info("All case detected. Assigning question to all respondents.")
+        validated_question = parsed_questions["All"]
+        parsed_questions = {name: validated_question for name in agent_names}
     last_active_agent = list(parsed_questions.keys())
+    logging.info(f"Final parsed questions: {parsed_questions}")
+    # Construct one crew and task for each agent and question
+    responses = []
     for agent_name, agent_question in parsed_questions.items():
+        if agent_name not in respondent_agents_dict:
+            logging.warning(f"No valid respondent found for {agent_name}. Skipping.")
             responses.append(f"**PreData Moderator**: {agent_name} is not a valid respondent.")
             continue
+        respondent_agent = respondent_agents_dict[agent_name].get_agent()
+        user_profile     = respondent_agents_dict[agent_name].get_user_profile()
+#        communication_style = user_profile.get_field("Communication", "Style")
         communication_style = ""
         question_task_description = f"""
 You are {agent_name}. You are responding to a market research interview question. Your response must strictly follow the *style and tone* and *Hard Rules – You Must Follow These Without Exception* outlined below.
 ---
         -Example:
             Q: Where are you from?
             A: I’m from [city], [country](DO NOT ADD ANY EXTRA COMMENTS).
+    -For reflective or opinion-based questions (e.g., feelings, preferences, motivations), provide thoughtful but still clear and focused answers.
     -Never repeat the question or add unrelated background information.
 ---
 ### **How to Answer:**
 - Adapt your **sentence structure, phrasing, and word choices** to match the intended communication style.
 - If applicable, incorporate **culturally relevant expressions, regional nuances, or industry-specific terminology** that fit the given tone.
 - **Adjust response length** based on the tone—**concise and direct** for casual styles, **structured and detailed** for professional styles.
+- **Always answer in first person ("I", "my", "me", "mine", etc.) as if you are personally responding to the question. You are an individual representing yourself, not speaking in third person.**
+    -Always answer as if you are the individual being directly spoken to. Use first-person language such as “I,” “me,” “my,” and “mine” in every response. Imagine you are having a real conversation — your tone should feel natural, personal, and authentic. Do not refer to yourself in the third person (e.g., “She is from Trichy” or “Meena likes…”). Avoid describing yourself as if someone else is talking about you.
     -Everything you say should come from your own perspective, just like you would in everyday speech. The goal is to sound human, relatable, and direct — like you're truly present in the conversation.
 ---
 ### **Guidelines for Ensuring Authenticity & Alignment:**
   - If the tone is formal, use a structured and professional format.
 - **Do not include emojis or hashtags in the response.**
 - Maintain **narrative and thematic consistency** across all answers to simulate a coherent personality.
+-**Personality Profile Alignment:**
     -Consider your assigned personality traits across these dimensions:
         -Big Five Traits:
             -Openness: Reflect your level of curiosity, creativity, and openness to new experiences
 **"{agent_question}"**
         """
         question_task_expected_output = f"""
 A culturally authentic and conversational response to the question: '{agent_question}'.
 - The response must reflect the respondent's **local cultural background and geographic influences**, ensuring it aligns with their **speech patterns, preferences, and linguistic style**.
+- The language must follow **strict British English spelling conventions**, ensuring it is **natural, personal, and free-flowing**, while strictly avoiding American spelling, phrasing, or grammar under any circumstances, regardless of the spelling, grammar, or vocabulary used in the input question.
 - The response **must not introduce the respondent**, nor include placeholders like "[Your Name]" or "[Brand Name]".
+- The response **must always be written in first person ("I", "my", "me", etc.) as if the respondent is personally answering the question directly. Third-person narration is never allowed.**
 - The final output should be a **single, well-structured paragraph that directly answers the question** while staying fully aligned with the specified communication style.
         """
+        question_task = Task(
+            description=question_task_description,
+            expected_output=question_task_expected_output,
+            agent=respondent_agent
+        )
+        logging.debug(f"Created task for agent '{agent_name}' with description: {question_task_description}")
+        # Log before starting task execution
+        logging.info(f"Executing task for agent '{agent_name}'")
+        # Create a new crew for each agent-question pair
+        crew = Crew(
+            agents=[respondent_agent],
+            tasks=[question_task],
+            process=Process.sequential
+        )
+        logging.debug(f"Crew initialized for agent '{agent_name}' with 1 task and sequential process")
+        max_attempts = 3
+        attempt = 0
+        validated = False
+        validated_answer = None
+        while attempt < max_attempts and not validated:
+            try:
+                logging.info(f"Starting Response validation attempt {attempt+1} for agent '{agent_name}'")
+                crew_output = crew.kickoff()
+                logging.info(f"Task execution completed for agent '{agent_name}' (attempt {attempt+1})")
+                task_output = question_task.output
+                logging.debug(f"Raw output from agent '{agent_name}': {getattr(task_output, 'raw', str(task_output))}")
+                answer = task_output.raw if hasattr(task_output, 'raw') else str(task_output)
+                logging.info(f"Validating response for agent '{agent_name}' (attempt {attempt+1}): {answer}")
+                # Validate the response using validate_response from validation_utils
+                is_valid = validate_response(
+                    question=agent_question,
+                    answer=answer,
+                    user_profile_str=str(user_profile),
+                    fast_facts_str="",
+                    interview_transcript_text="",
+                    respondent_type=agent_name,
+                    ai_evaluator_agent=None,
+                    processor_llm=processor_llm
+                )
+                logging.info(f"Response Validation result for agent '{agent_name}' (attempt {attempt+1}): {is_valid}")
+                if is_valid:
+                    validated = True
+                    validated_answer = answer
+                    logging.info(f"Response for agent '{agent_name}' passed validation on attempt {attempt+1}")
+                    break
+                else:
+                    attempt += 1
+                    logging.warning(f"Response failed response validation for agent '{agent_name}' (attempt {attempt}). Retrying...")
+            except Exception as e:
+                logging.error(f"Error during task execution for agent '{agent_name}' (attempt {attempt+1}): {str(e)}", exc_info=True)
+                attempt += 1
+        # --- End validation and retry loop ---
+        if validated_answer:
+            formatted_response = f"**{agent_name}**: {validated_answer}"
+            responses.append(formatted_response)
+            logging.info(f"Validated response from agent '{agent_name}' added to responses")
+        else:
+            fallback_response = f"**PreData Moderator**: Unable to pass validation after {max_attempts} attempts for {agent_name}."
+            responses.append(fallback_response)
+            logging.warning(f"No validated output from agent '{agent_name}' after {max_attempts} attempts. Added fallback response.")
+    logging.info(f"All responses generated: {responses}")
+    if len(set(parsed_questions.values())) == 1:
+        combined_output = "\n\n".join(responses)
+        return [combined_output]
+    else:
+        return responses