# Last change (commit 0e5d4ec, igiuseppe): Fix JSON response parsing in
# ux_testing_fsm function to directly access the response object.
import json
from typing import List, Dict, Any
from pydantic import BaseModel
from concurrent.futures import ThreadPoolExecutor
from utils import call_llm
import logging
from prompts import (
GENERATE_USER_PARAMETERS_PROMPT,
GENERATE_SYNTHETIC_PERSONAS_PROMPT,
CHAT_WITH_PERSONA_PROMPT,
ASK_QUESTIONS_TO_PERSONA_PROMPT,
GENERATE_REPORT_PROMPT,
CHAT_WITH_REPORT_PROMPT,
GENERATE_AUDIENCE_NAME_PROMPT,
UX_FSM_SIMPLE_PROMPT,
persona_schema,
answers_schema
)
logger = logging.getLogger(__name__)
MAX_WORKERS=10
def generate_user_parameters(audience: str, scope: str, n: int = 24) -> List[str]:
    """Return persona parameter names for the given audience and scope.

    Combines a fixed set of standard parameters with LLM-generated additional
    ones, split between general (20) and scope-specific parameters.
    """
    class Response(BaseModel):
        additional_parameters: list[str]

    standard_parameters = ["Name", "Age", "Location", "Profession"]
    n_general = 20
    prompt = GENERATE_USER_PARAMETERS_PROMPT.format(
        audience=audience,
        scope=scope,
        standard_parameters=standard_parameters,
        n=n,
        n_specific=n - n_general,
        n_general=n_general,
    )
    raw = call_llm(prompt=prompt, response_format=Response, model_type="mid", temperature=0)
    extra = json.loads(raw)["additional_parameters"]
    return standard_parameters + extra
def build_previous_personas_context(previous_personas: List[Dict[str, Any]]) -> str:
    """Render existing personas as a delimited text block for prompt context.

    Each persona's fields are listed one per line; the 'answers' field is
    intentionally omitted.
    """
    parts = ["\n\n--- Existing Personas Context ---\n"]
    for idx, persona in enumerate(previous_personas, 1):
        parts.append(f"\nExisting Persona {idx}:\n")
        field_lines = [f"{key}: {val}" for key, val in persona.items() if key != 'answers']
        parts.append("\n".join(field_lines) + "\n")
    parts.append("--- End Existing Personas Context ---")
    return "".join(parts)
def generate_synthetic_personas(num_personas: int, audience: str, previous_personas: List[Dict[str, Any]] = None) -> Dict:
    """
    Generate synthetic personas, ensuring variability by considering previously generated personas.
    Retries LLM calls if fewer personas than requested are returned, up to a limit.
    Args:
        num_personas: Total number of personas to generate
        audience: Target audience for the personas
        previous_personas: Optional list of already existing personas to ensure differentiation.
    Returns:
        Dictionary with the newly generated personas under the "users_personas" key.
    """
    all_new_personas: List[Dict[str, Any]] = []
    max_iterations = 5  # Safety break to prevent infinite loops
    current_iteration = 0
    while len(all_new_personas) < num_personas and current_iteration < max_iterations:
        current_iteration += 1
        needed_personas = num_personas - len(all_new_personas)
        # Lazy %-style args so formatting work is skipped when the level is disabled.
        logger.info(
            "Iteration %s/%s: Requesting %s more personas (Total needed: %s, Have: %s)...",
            current_iteration, max_iterations, needed_personas, num_personas, len(all_new_personas),
        )
        response_format = persona_schema(needed_personas)
        # Combine original previous_personas with those generated in this function's previous iterations
        current_context_personas = (previous_personas or []) + all_new_personas
        prompt = GENERATE_SYNTHETIC_PERSONAS_PROMPT.format(
            needed_personas=needed_personas,
            audience=audience
        )
        if current_context_personas:
            # Add context and the requirement for differentiation
            prompt += "\n\n"
            prompt += f"To ensure diversity, we have already generated {len(current_context_personas)} persona(s) for this audience. Their details are listed below.\n"
            prompt += "LAST IMPORTANT REQUIREMENT: Each new persona you generate MUST be significantly different from these existing ones.\n"
            prompt += build_previous_personas_context(current_context_personas)  # Appends the formatted list
        try:
            response_str = call_llm(prompt=prompt, response_format=response_format, temperature=1, model_type="mid", shuffle=False)
            iteration_personas = json.loads(response_str).get("users_personas", [])
            num_received_iteration = len(iteration_personas)
            logger.info("Iteration %s: Received %s personas (requested %s).",
                        current_iteration, num_received_iteration, needed_personas)
            if num_received_iteration == 0 and needed_personas > 0:
                logger.warning("Iteration %s: Received 0 personas despite needing %s. Stopping attempts for this request.",
                               current_iteration, needed_personas)
                break  # Stop if LLM returns 0 when we still need more
            all_new_personas.extend(iteration_personas)
        except Exception as e:
            logger.error("Iteration %s: Error during LLM call or processing: %s", current_iteration, e)
            # Abort on an iteration error rather than retrying a failing call.
            break
    # Final check and logging
    if len(all_new_personas) < num_personas:
        logger.warning("generate_synthetic_personas finished after %s iterations, but only generated %s/%s requested personas.",
                       current_iteration, len(all_new_personas), num_personas)
    else:
        logger.info("generate_synthetic_personas successfully generated %s personas in %s iterations.",
                    len(all_new_personas), current_iteration)
    return {"users_personas": all_new_personas}
# Renamed and simplified: Processes one question for one persona
def ask_single_question_to_persona(persona: dict, question: str) -> str:
    """Ask one question to one persona; return the answer, or an error string on failure."""
    try:
        answer = call_llm(
            prompt=CHAT_WITH_PERSONA_PROMPT.format(persona=persona, question=question),
            temperature=0,
            model_type="low",
            shuffle=False,
        )
    except Exception as e:
        logger.error(f"Error asking question '{question}' to persona {persona.get('Name', 'Unknown')}: {e}")
        return f"Error generating answer for question: {question}"
    return answer
def ask_all_questions_to_persona(persona: dict, questions: List[str], context: str = None) -> List[str]:
    """Ask all questions to a single persona in one structured LLM call.

    Args:
        persona: The persona dict to answer as.
        questions: Questions to ask in this call.
        context: Optional extra context appended to the prompt.
    Returns:
        List of answers, one per question. On any failure the constant string
        "Error generating answers" is returned instead of a list (callers
        should treat a non-list result as an error marker).
    """
    response_format = answers_schema(len(questions))
    try:
        prompt = ASK_QUESTIONS_TO_PERSONA_PROMPT.format(
            persona=persona,
            questions=questions,
            num_questions=len(questions)
        )
        if context:
            prompt += f"\n\nHere is some context that might be relevant to the questions: {context}"
        response_str = call_llm(prompt=prompt, temperature=0.5, model_type="mid", response_format=response_format, shuffle=False)
        return json.loads(response_str).get("answers", [])
    except Exception as e:
        logger.error(f"Error asking questions to persona {persona.get('Name', 'Unknown')}: {e}")
        return "Error generating answers"
def add_answers_to_users_bulk(users_personas: List, questions: List[str], context: str = None) -> List[Dict]:
    """
    Adds answers to each user persona by asking all questions at once for each persona.
    Processes all personas in parallel for better efficiency.
    Args:
        users_personas: List of user personas
        questions: List of questions to ask each persona
        context: Optional extra context forwarded to each persona's prompt
    Returns:
        List of personas with their answers added under the 'answers' key
    """
    personas_list = users_personas
    if not personas_list or not questions:
        # Nothing to ask: ensure 'answers' key exists (empty) and return unchanged
        for p in personas_list:
            p["answers"] = []
        return personas_list

    # Helper function to process a single persona with all questions.
    # Mutates the persona in place, attaching its answers list.
    def process_persona(persona):
        try:
            persona["answers"] = ask_all_questions_to_persona(persona, questions, context)
        except Exception as e:
            logger.error(f"Error processing all questions for persona {persona.get('Name', 'Unknown')}: {e}")
            persona["answers"] = ["Error generating answer"] * len(questions)
        return persona

    # Fan out one LLM request per persona, bounded by MAX_WORKERS.
    max_workers = min(MAX_WORKERS, len(personas_list))
    with ThreadPoolExecutor(max_workers=max_workers) as executor:
        return list(executor.map(process_persona, personas_list))
def add_answers_to_users(users_personas: List, questions: List[str]) -> List[Dict]:
    """
    Adds answers to each user persona by processing a flat list of (persona, question) pairs in parallel.
    Ensures the order of answers matches the order of questions for each persona.
    """
    personas_list = users_personas
    if not personas_list or not questions:
        for p in personas_list:
            p["answers"] = []  # Ensure 'answers' key exists even if empty
        return personas_list
    num_questions = len(questions)
    # One task per (persona, question) pair, persona-major order.
    tasks = [(persona, question) for persona in personas_list for question in questions]

    # Unpacks one task tuple and asks the single question.
    def run_task(pair):
        persona_dict, question_str = pair
        return ask_single_question_to_persona(persona_dict, question_str)

    # executor.map preserves input order, so answers line up with tasks.
    with ThreadPoolExecutor(max_workers=min(MAX_WORKERS, len(tasks))) as executor:
        flat_answers = list(executor.map(run_task, tasks))
    # Reassemble: each persona owns a contiguous slice of num_questions answers.
    fleet = []
    for idx, persona in enumerate(personas_list):
        start = idx * num_questions
        persona["answers"] = flat_answers[start:start + num_questions]
        fleet.append(persona)
    return fleet
def generate_content(fleet, questions=None, scope=None) -> str:
    """Serialize scope, questions, and each persona (with answers) into a plain-text report body."""
    chunks = []
    if scope:
        chunks.append(f"Scope of Research:\n{scope}\n\n")
    if questions:
        chunks.append("Questions:\n")
        chunks.extend(f"Q{i}: {question}\n" for i, question in enumerate(questions, 1))
        chunks.append("\n")
    for i, user in enumerate(fleet, 1):
        chunks.append(f"### User {i} ###\n")
        # Persona attributes first (answers are rendered separately below).
        for key, value in user.items():
            if key != "answers":
                chunks.append(f"{key}: {value}\n")
        chunks.append("\n")
        chunks.extend(f"Q{j}: {answer}\n\n" for j, answer in enumerate(user.get("answers", []), 1))
        chunks.append("\n---\n\n")
    return "".join(chunks)
def generate_report(questions, fleet, scope) -> str:
    """Build the research content and ask the LLM to turn it into a report."""
    report_prompt = GENERATE_REPORT_PROMPT.format(
        content=generate_content(questions=questions, fleet=fleet, scope=scope),
        scope=scope,
    )
    return call_llm(prompt=report_prompt, model_type="mid", temperature=0)
def chat_with_persona(persona: dict, question: str, conversation_history: List[dict] = None) -> str:
    """
    Chat with a specific persona, taking into account conversation history if provided.
    Args:
        persona: The user persona to chat with
        question: The current question to ask
        conversation_history: List of previous Q&A pairs, if any
    Returns:
        The persona's answer to the question
    """
    prompt = CHAT_WITH_PERSONA_PROMPT.format(persona=persona, question=question)
    if conversation_history:
        # Replay prior turns so the persona stays consistent with them.
        turns = "".join(
            f"Q: {chat['question']}\nA: {chat['answer']}\n" for chat in conversation_history
        )
        history_context = "\nPrevious conversation:\n" + turns
        prompt += f"\nHere you have the previous conversation, make sure to answer the question in a way that is consistent with it:\n{history_context}"
    return call_llm(prompt=prompt, temperature=0.5, model_type="mid", shuffle=False)
def chat_with_report(users: List[dict], question: str, questions: List[str]) -> str:
    """
    Chat with the content of a report, using the provided users' data.
    Args:
        users: List of user personas with their answers (fleet)
        question: The question to ask about the report content
        questions: List of questions that were asked to the users
    Returns:
        The answer based on the report content
    """
    # Rebuild the same content string the report was generated from.
    report_content = generate_content(fleet=users, questions=questions)
    return call_llm(
        prompt=CHAT_WITH_REPORT_PROMPT.format(content=report_content, question=question),
        temperature=0,
        model_type="low",
    )
def generate_audience_name(audience: str, scope: str) -> str:
    """
    Generate a concise audience name based on the provided audience description and scope.
    Args:
        audience: Detailed audience description
        scope: Research scope
    Returns:
        String containing a concise audience name
    """
    name = call_llm(
        prompt=GENERATE_AUDIENCE_NAME_PROMPT.format(audience=audience, scope=scope),
        temperature=0,
        model_type="low",
    )
    return name.strip()
def ux_testing_fsm(persona: dict, task: str, image: str, available_actions: list, session_history: list = None) -> dict:
    """
    Conduct simple FSM-based UX testing with a persona.

    One call = one FSM step: the persona looks at the current interface image,
    reads its session history, and picks exactly one of the available actions.
    Args:
        persona: User persona to conduct testing with
        task: The task the persona needs to accomplish
        image: URL of the current interface image
        available_actions: List of available actions in current state
        session_history: List of previous steps in this session (dicts with
            'action_taken' and 'thought' keys)
    Returns:
        Dictionary with action_taken, thought, task_finished, and task_difficulty.
        On any error, a fallback dict is returned with the first available
        action, task_finished=False and task_difficulty=None.
    """
    # Format available actions
    actions_text = ", ".join(available_actions)
    # Format session history
    if session_history:
        history_text = "Previous steps in this session:\n"
        for i, step in enumerate(session_history, 1):
            history_text += f"Step {i}: Action '{step.get('action_taken', 'unknown')}' - {step.get('thought', 'No thought recorded')}\n"
    else:
        history_text = "This is the first step of the session."
    prompt = UX_FSM_SIMPLE_PROMPT.format(
        persona=persona,
        task=task,
        available_actions=actions_text,
        session_history=history_text
    )
    # Define response format for structured JSON.
    # NOTE(review): OpenAI-style strict json_schema payload. "enum":
    # available_actions constrains the model to this state's actions;
    # presumably available_actions is non-empty here — an empty enum would
    # make the schema unsatisfiable. TODO confirm with callers.
    response_format = {
        "type": "json_schema",
        "json_schema": {
            "name": "ux_testing_response",
            "schema": {
                "type": "object",
                "properties": {
                    "action_taken": {
                        "type": "string",
                        "description": "The action chosen from available actions",
                        "enum": available_actions
                    },
                    "thought": {
                        "type": "string",
                        "description": "Reasoning for the action"
                    },
                    "task_finished": {
                        "type": "boolean",
                        "description": "Whether the task is complete"
                    },
                    "task_difficulty": {
                        # Nullable so the model can omit a rating mid-task.
                        "type": ["number", "null"],
                        "minimum": 1.0,
                        "maximum": 5.0,
                        "description": "Difficulty rating if task is finished"
                    }
                },
                "required": ["action_taken", "thought", "task_finished", "task_difficulty"],
                "additionalProperties": False
            },
            "strict": True
        }
    }
    try:
        # Call LLM with the image and structured response format
        response = call_llm(
            prompt=prompt,
            temperature=0.7,
            model_type="mid",
            images=[image],
            response_format=response_format
        )
        # Parse JSON response (call_llm is expected to return the raw JSON text)
        parsed_response = json.loads(response)
        # Validate action is in available actions — the schema enum should
        # already enforce this, but guard anyway in case the model strays.
        if parsed_response.get("action_taken") not in available_actions:
            logger.warning(f"Persona chose invalid action: {parsed_response.get('action_taken')}. Using first available action.")
            parsed_response["action_taken"] = available_actions[0] if available_actions else "unknown"
        logger.info(f"UX FSM testing completed for persona: {persona.get('Name', 'Unknown')}")
        logger.info(f"Action taken: {parsed_response.get('action_taken')}")
        logger.info(f"Task finished: {parsed_response.get('task_finished')}")
        return parsed_response
    except Exception as e:
        logger.error(f"Error during UX FSM testing for persona {persona.get('Name', 'Unknown')}: {e}")
        # Best-effort fallback so the FSM loop can continue after a failure.
        return {
            "action_taken": available_actions[0] if available_actions else "unknown",
            "thought": f"Error occurred during testing: {str(e)}",
            "task_finished": False,
            "task_difficulty": None
        }