Spaces:

hmqid03
/

vietqa-api

Sleeping

quanho114

Add chat mode support - natural responses without MCQ format

55f1010 24 days ago

11.7 kB

	"""Logic solver node implementing a Manual Code Execution workflow."""

	import re
	import string

	from langchain_core.messages import BaseMessage, HumanMessage, SystemMessage
	from langchain_experimental.utilities import PythonREPL

	from src.data_processing.answer import extract_answer
	from src.data_processing.formatting import format_choices
	from src.state import GraphState
	from src.utils.llm import get_large_model
	from src.utils.logging import print_log
	from src.utils.prompts import load_prompt

	_python_repl = PythonREPL()


	def extract_python_code(text: str) -> str \| None:
	"""Find and extract Python code from block ``` python ... ```"""
	match = re.search(r"```(?:python)?\s(.?)```", text, re.DOTALL \| re.IGNORECASE)
	if match:
	return match.group(1).strip()
	return None


	def _validate_code_syntax(code: str) -> tuple[bool, str]:
	"""Check if code has valid Python syntax. Returns (is_valid, error_message)."""
	try:
	compile(code, "<string>", "exec")
	return True, ""
	except SyntaxError as e:
	return False, str(e)


	def _is_placeholder_code(code: str) -> bool:
	"""Check if code contains placeholders or is incomplete."""
	if not code or len(code.strip()) < 10:
	return True
	if "..." in code:
	return True
	# Check for {key}-style placeholders (but not f-string or dict literals)
	if re.search(r"\{[a-zA-Z_][a-zA-Z0-9_]*\}", code):
	# Exclude common dict/set patterns and f-strings
	if not re.search(r'["\'][^"\']*\{[a-zA-Z_]', code):
	return True
	return False


	def _indent_code(code: str) -> str:
	"""Format code to make it easier to read in the terminal."""
	return "\n".join(f" {line}" for line in code.splitlines())


	def _fallback_text_reasoning(llm, question: str, choices_text: str) -> dict:
	"""Fallback to CoT reasoning when code execution fails."""
	print_log(" [Logic] Falling back to CoT reasoning...")

	fallback_system = (
	"Nhiệm vụ của bạn là trả lời câu hỏi "
	"được đưa ra bằng khả năng phân tích và suy luận logic. "
	"Hãy phân tích vấn đề và suy luận đề từng bước một. "
	"Cuối cùng, hãy trả lời theo đúng định dạng: 'Đáp án: X' "
	"trong đó X là ký tự đại diện cho lựa chọn đúng (A, B, C, D, ...)."
	)

	fallback_user = (
	f"Câu hỏi: {question}\n"
	f"{choices_text}"
	)

	fallback_messages: list[BaseMessage] = [
	SystemMessage(content=fallback_system),
	HumanMessage(content=fallback_user)
	]

	fallback_response = llm.invoke(fallback_messages)
	fallback_content = fallback_response.content
	print_log(f" [Logic] Fallback response received.")

	return {"text": fallback_content}


	def _request_final_answer(llm, question: str, choices_text: str, computed_results: str) -> str:
	"""Request a strict final answer from the model."""
	system_prompt = (
	"Bạn là trợ lý AI. Dựa vào kết quả tính toán được cung cấp, "
	"hãy đưa ra đáp án cuối cùng. CHỈ trả lời đúng một dòng: Đáp án: X "
	"(trong đó X là A, B, C hoặc D)."
	)
	user_prompt = (
	f"Câu hỏi: {question}\n"
	f"{choices_text}\n"
	f"Kết quả tính toán: {computed_results}\n\n"
	"Trả lời đúng một dòng: Đáp án: X"
	)

	messages: list[BaseMessage] = [
	SystemMessage(content=system_prompt),
	HumanMessage(content=user_prompt)
	]

	response = llm.invoke(messages)
	return response.content


	def logic_solver_node(state: GraphState) -> dict:
	"""Solve math/logic questions using Python code execution."""
	llm = get_large_model()
	all_choices = state["all_choices"]
	num_choices = len(all_choices)
	choices_text = format_choices(all_choices)
	is_chat_mode = num_choices == 0 # Chat mode when no choices

	system_prompt = load_prompt("logic_solver.j2", "system", choices=choices_text)
	user_prompt = load_prompt("logic_solver.j2", "user", question=state["question"], choices=choices_text)

	messages: list[BaseMessage] = [
	SystemMessage(content=system_prompt),
	HumanMessage(content=user_prompt)
	]

	step_texts: list[str] = []
	computed_outputs: list[str] = []

	# Chat mode: just invoke LLM and return natural response
	if is_chat_mode:
	print_log(" [Logic] Chat mode detected - returning natural response")
	response = llm.invoke(messages)
	content = response.content
	return {"answer": "", "raw_response": content, "route": "math"}

	max_steps = 5
	for step in range(max_steps):
	response = llm.invoke(messages)
	content = response.content
	step_texts.append(content)
	messages.append(response)

	code_block = extract_python_code(content)

	if code_block:
	if _is_placeholder_code(code_block):
	print_log(f" [Logic] Step {step+1}: Placeholder code detected. Requesting complete code...")
	regen_msg = (
	"Code không hợp lệ (chứa placeholder hoặc không đầy đủ). "
	"Hãy cung cấp code Python hoàn chỉnh, có thể chạy được, không chứa '...' hay placeholder. "
	"In ra các giá trị tính toán được. "
	"Cuối cùng, kết thúc bằng một dòng duy nhất: Đáp án: X (X là A, B, C hoặc D)."
	)
	messages.append(HumanMessage(content=regen_msg))
	continue

	print_log(f" [Logic] Step {step+1}: Found Python code. Executing...")

	# Validate syntax before execution
	is_valid, syntax_error = _validate_code_syntax(code_block)
	if not is_valid:
	print_log(f" [Error] Syntax error detected: {syntax_error}")
	error_msg = f"SyntaxError: {syntax_error}. "
	error_msg += "Lưu ý: KHÔNG sử dụng các từ khóa Python như 'lambda', 'class', 'def' làm tên biến. "
	error_msg += "Hãy đổi tên biến và thử lại."
	messages.append(HumanMessage(content=error_msg))
	continue

	print_log(f" [Logic] Code:\n{_indent_code(code_block)}")

	try:
	if "print" not in code_block:
	lines = code_block.splitlines()
	if lines:
	last_line = lines[-1]
	if "=" in last_line:
	var_name = last_line.split("=")[0].strip()
	else:
	var_name = last_line.strip()
	code_block += f"\nprint({var_name})"

	output = _python_repl.run(code_block)
	output = output.strip() if output else "No output."
	print_log(f" [Logic] Code output: {output}")
	computed_outputs.append(output)

	# Do NOT extract answer from code output directly
	# Instead, feed output back to model and ask for final answer line
	feedback_msg = (
	f"Kết quả thực thi code: {output}\n\n"
	"Dựa vào kết quả trên, hãy so sánh với các đáp án và đưa ra câu trả lời cuối cùng. "
	"Kết thúc bằng đúng một dòng: Đáp án: X (X là A, B, C hoặc D)."
	)
	messages.append(HumanMessage(content=feedback_msg))

	except Exception as e:
	error_msg = f"Error running code: {str(e)}"
	print_log(f" [Error] {error_msg}")
	messages.append(HumanMessage(content=f"{error_msg}. Hãy kiểm tra logic và sửa lại code."))

	continue

	# Check if current step contains an explicit answer (only at end of response)
	step_answer = extract_answer(content, num_choices=num_choices, require_end=True)
	if step_answer:
	print_log(f" [Logic] Step {step+1}: Found explicit answer: {step_answer}")
	combined_raw = "\n---STEP---\n".join(step_texts)
	return {"answer": step_answer, "raw_response": combined_raw, "route": "math"}

	# Also check if response contains clear conclusion without "Đáp án:" format
	if any(phrase in content.lower() for phrase in ["kết luận", "vậy đáp án", "do đó", "vì vậy"]):
	# Try to extract any single letter at end of response
	lines = content.strip().split('\n')
	for line in reversed(lines[-3:]): # Check last 3 lines
	line = line.strip()
	if len(line) == 1 and line.upper() in string.ascii_uppercase[:num_choices]:
	print_log(f" [Logic] Step {step+1}: Found implicit answer: {line.upper()}")
	combined_raw = "\n---STEP---\n".join(step_texts)
	return {"answer": line.upper(), "raw_response": combined_raw, "route": "math"}

	if step < max_steps - 1:
	print_log(" [Warning] No code or answer found. Reminding model...")
	messages.append(HumanMessage(content="Lưu ý: Bạn vẫn chưa đưa ra đáp án cuối cùng. Hãy kết thúc bằng: Đáp án: X"))

	# Max steps reached - build combined_raw and try to extract answer
	print_log(" [Warning] Max steps reached. Attempting answer extraction from combined text...")

	# Build combined_raw from all steps
	combined_raw = "\n---STEP---\n".join(step_texts) if step_texts else ""

	# Try fallback text reasoning with error handling
	try:
	fallback_result = _fallback_text_reasoning(llm, state["question"], choices_text)
	fallback_text = fallback_result["text"]
	if fallback_text:
	combined_raw += "\n---FALLBACK---\n" + fallback_text
	except Exception as e:
	print_log(f" [Error] Fallback reasoning failed: {e}")
	fallback_text = ""

	# Extract answer from the entire combined text (takes LAST explicit answer)
	final_answer = extract_answer(combined_raw, num_choices=num_choices)

	if final_answer:
	print_log(f" [Logic] Extracted final answer from combined text: {final_answer}")
	return {"answer": final_answer, "raw_response": combined_raw, "route": "math"}

	# Still no answer - do one final strict LLM call with error handling
	print_log(" [Logic] No explicit answer found. Requesting strict final answer...")
	computed_str = "; ".join(computed_outputs) if computed_outputs else "Không có kết quả tính toán"
	try:
	strict_response = _request_final_answer(llm, state["question"], choices_text, computed_str)
	combined_raw += "\n---FINAL---\n" + strict_response

	final_answer = extract_answer(strict_response, num_choices=num_choices)
	if final_answer:
	print_log(f" [Logic] Final strict answer: {final_answer}")
	return {"answer": final_answer, "raw_response": combined_raw, "route": "math"}
	except Exception as e:
	print_log(f" [Error] Final answer request failed: {e}")

	# Absolute fallback - default to A
	print_log(" [Warning] All extraction attempts failed. Defaulting to A.")
	return {"answer": "A", "raw_response": combined_raw, "route": "math"}