Spaces:

s-b3
/

LifeStack

Sleeping

LifeStack / tests /test_reward_reasoning.py

Soham Banerjee

deploy: pure lifestack with partitioned wisdom pool

77da5ce about 1 month ago

2.04 kB

	import sys
	import os
	sys.path.append(os.getcwd())

	from core.reward import compute_task_reward
	from core.life_state import LifeMetrics
	from core.task import Task

	def test_reasoning_alignment_pass():
	"""Verify that reasoning mentioning the action category gets higher score."""
	state = LifeMetrics()
	task = Task(
	"test",
	"career",
	"test",
	{}, {}, {}, {}, # constraints, hidden, mutable, visible
	[], [], # success, failure
	[], [], [], # events, routes, milestones
	10, 1, {} # horizon, diff, metadata
	)

	# Action: SPEND, Reasoning: mentions cost
	_, res_match = compute_task_reward(
	state_before=state, state_after=state, resources_used={}, actions_taken=1,
	milestones_achieved=[], success_conditions_met=[], exo_events_seen=0,
	milestones_after_event=0, routes_remaining=1, rollback_used=False,
	cascade_collapse=False, task=task, action_type="spend",
	reasoning="I am doing this because the cost is low."
	)

	# Action: SPEND, Reasoning: mentions nothing relevant
	_, res_mismatch = compute_task_reward(
	state_before=state, state_after=state, resources_used={}, actions_taken=1,
	milestones_achieved=[], success_conditions_met=[], exo_events_seen=0,
	milestones_after_event=0, routes_remaining=1, rollback_used=False,
	cascade_collapse=False, task=task, action_type="spend",
	reasoning="I am doing this because I am happy."
	)

	score_match = res_match["components"]["reasoning"]
	score_mismatch = res_mismatch["components"]["reasoning"]

	print(f"Match Score: {score_match}")
	print(f"Mismatch Score: {score_mismatch}")

	assert score_match > score_mismatch, f"Match {score_match} should be > Mismatch {score_mismatch}"
	print("✅ Reasoning alignment test passed!")

	if __name__ == "__main__":
	try:
	test_reasoning_alignment_pass()
	except Exception as e:
	print(f"❌ Test failed: {e}")
	sys.exit(1)