Spaces:

OpenDILabCommunity
/

gomoku

Running

init space

3dfe8fb about 2 years ago

1.03 kB

	import pytest
	import gym
	import numpy as np
	from easydict import EasyDict
	from dizoo.pomdp.envs import PomdpAtariEnv


	@pytest.mark.envtest
	def test_env():
	    """Play one random-action episode on ``PomdpAtariEnv`` and check its outputs.

	    The environment is built for ``Pong-ramNoFrameskip-v4`` with RAM
	    observations, a frame stack of 4 and the POMDP perturbation settings
	    given in ``cfg['pomdp']``. On every step the test asserts that the
	    observation has shape ``(512, )`` and the reward has shape ``(1, )``.
	    When the episode finishes, ``timestep.info`` must contain
	    ``'eval_episode_return'``.

	    The environment is closed in a ``finally`` clause so that a failing
	    assertion (or an error raised by ``step``) does not leave it open.
	    """
	    cfg = {
	        'env_id': 'Pong-ramNoFrameskip-v4',
	        'frame_stack': 4,
	        'is_train': True,
	        'warp_frame': False,
	        'clip_reward': False,
	        'use_ram': True,
	        'render': False,
	        'pomdp': dict(noise_scale=0.001, zero_p=0.1, reward_noise=0.01, duplicate_p=0.2)
	    }

	    cfg = EasyDict(cfg)
	    pong_env = PomdpAtariEnv(cfg)
	    try:
	        pong_env.seed(0)
	        # The initial observation is not inspected; reset() is only needed
	        # to start the episode before stepping.
	        pong_env.reset()
	        act_dim = pong_env.info().act_space.shape[0]
	        while True:
	            # Sample one action index uniformly, wrapped in a length-1 array.
	            random_action = np.random.choice(range(act_dim), size=(1, ))
	            timestep = pong_env.step(random_action)
	            # NOTE(review): 512 presumably equals 128 RAM bytes x 4 stacked
	            # frames -- confirm against the env implementation.
	            assert timestep.obs.shape == (512, )
	            assert timestep.reward.shape == (1, )
	            if timestep.done:
	                # Pass the info dict as the message so a failure shows its keys.
	                assert 'eval_episode_return' in timestep.info, timestep.info
	                break
	    finally:
	        # Always release the environment, even when an assertion above fails.
	        pong_env.close()