import evoagentx.workflow.operators as operator import examples.aflow.humaneval.optimized.round_9.prompt as prompt_custom from evoagentx.models.model_configs import LLMConfig from evoagentx.benchmark.benchmark import Benchmark from evoagentx.models.model_utils import create_llm_instance class Workflow: def __init__( self, name: str, llm_config: LLMConfig, benchmark: Benchmark ): self.name = name self.llm = create_llm_instance(llm_config) self.benchmark = benchmark self.custom = operator.Custom(self.llm) self.custom_code_generate = operator.CustomCodeGenerate(self.llm) self.test = operator.Test(self.llm) # New operator for testing solutions async def __call__(self, problem: str, entry_point: str): """ Implementation of the workflow Custom operator to generate anything you want. But when you want to get standard code, you should use custom_code_generate operator. """ # Generate multiple solutions for a robust selection process solutions = [] for _ in range(3): # Generate 3 potential solutions response = await self.custom_code_generate(problem=problem, entry_point=entry_point, instruction=prompt_custom.GENERATE_PYTHON_CODE_PROMPT) solutions.append(response['response']) # Use self-ensemble approach to select the best solution based on frequency ensemble_solution = await self.custom(input="Solutions: " + ", ".join(solutions), instruction=prompt_custom.ScEN_PYTHON_SELECTION_PROMPT) # Testing the selected ensemble solution test_result = await self.test(problem=problem, solution=ensemble_solution['response'], entry_point=entry_point, benchmark=self.benchmark) if test_result['result']: return test_result['solution'] # Return the validated solution else: return "The generated solution did not pass the tests." # Handle failed tests