Spaces:

Abeee32t
/

ArbitrAgent

Runtime error

ArbitrAgent / test_all_envs.py

AbeBhatti

Verification pass — all 6 tests green

d1f302c about 1 month ago

3.76 kB

	"""OpenEnv compliance tests for DiplomacyNegotiationEnv, ContractorNegotiationEnv, HumanImitationEnv."""
	import sys

	def check_env(name, env_class, has_different_resets=True):
	from openenv.env import Env
	passed = 0
	failed = []

	# MRO confirms inheritance from openenv.env.Env
	mro_names = [c.__name__ for c in env_class.__mro__]
	if "Env" in mro_names and env_class.__mro__[0] == env_class:
	print(f" {name} MRO inherits from openenv.env.Env: PASS")
	passed += 1
	else:
	print(f" {name} MRO inherits from openenv.env.Env: FAIL (MRO={mro_names})")
	failed.append("MRO")

	env = env_class()

	# reset() returns (obs, info) where obs.shape == (384,)
	obs, info = env.reset()
	if isinstance(obs, __import__("numpy").ndarray) and obs.shape == (384,):
	print(f" {name} reset() obs.shape == (384,): PASS")
	passed += 1
	else:
	sh = getattr(obs, "shape", type(obs).__name__)
	print(f" {name} reset() obs.shape == (384,): FAIL (obs.shape={sh})")
	failed.append("reset_obs_shape")

	# step(action) returns (obs, reward, done, info) with reward as real float
	try:
	obs2, reward, done, info2 = env.step("test action")
	if isinstance(reward, (int, float)) and not isinstance(reward, bool):
	print(f" {name} step() returns (obs, reward, done, info) reward float: PASS")
	passed += 1
	else:
	print(f" {name} step() reward is real float: FAIL (type={type(reward).__name__})")
	failed.append("step_reward_float")
	except Exception as e:
	print(f" {name} step() returns 4-tuple: FAIL ({e})")
	failed.append("step")

	# render() returns non-empty string
	out = env.render()
	if isinstance(out, str) and len(out.strip()) > 0:
	print(f" {name} render() non-empty string: PASS")
	passed += 1
	else:
	print(f" {name} render() non-empty string: FAIL (type={type(out).__name__}, len={len(out) if isinstance(out, str) else 'N/A'})")
	failed.append("render")

	# Each reset() gives DIFFERENT output (not hardcoded) — only for envs that support it
	if has_different_resets:
	obs_a, _ = env.reset()
	obs_b, _ = env.reset()
	diff = (obs_a != obs_b)
	if isinstance(diff, __import__("numpy").ndarray):
	different = diff.any()
	else:
	different = obs_a != obs_b
	if different:
	print(f" {name} reset() gives different output: PASS")
	passed += 1
	else:
	print(f" {name} reset() gives different output: FAIL (observations identical)")
	failed.append("reset_different")

	return passed, failed


	def main():
	print("Testing all three environments (OpenEnv compliance)")
	print("=" * 50)

	from envs.diplomacy_env import DiplomacyNegotiationEnv
	from envs.contractor_env import ContractorNegotiationEnv
	from envs.human_imitation_env import HumanImitationEnv

	total_passed = 0
	total_failed = []

	for label, env_class, different_resets in [
	("DiplomacyNegotiationEnv", DiplomacyNegotiationEnv, True),
	("ContractorNegotiationEnv", ContractorNegotiationEnv, True),
	("HumanImitationEnv", HumanImitationEnv, True),
	]:
	print(f"\n--- {label} ---")
	p, f = check_env(label, env_class, has_different_resets=different_resets)
	total_passed += p
	total_failed.extend([(label, x) for x in f])

	print("\n" + "=" * 50)
	if total_failed:
	print(f"RESULT: {total_passed} checks PASSED, {len(total_failed)} FAILED")
	sys.exit(1)
	print("All OpenEnv compliance checks passed.")
	sys.exit(0)


	if __name__ == "__main__":
	main()