mirror of
https://github.com/vale981/ray
synced 2025-03-09 12:56:46 -04:00
166 lines
5.3 KiB
Python
166 lines
5.3 KiB
Python
import unittest
|
|
|
|
import gym
|
|
import numpy as np
|
|
|
|
from ray.rllib.utils.serialization import (
|
|
gym_space_from_dict,
|
|
gym_space_to_dict,
|
|
space_from_dict,
|
|
space_to_dict,
|
|
)
|
|
from ray.rllib.utils.spaces.flexdict import FlexDict
|
|
from ray.rllib.utils.spaces.repeated import Repeated
|
|
from ray.rllib.utils.spaces.simplex import Simplex
|
|
|
|
|
|
def _assert_array_equal(eq, a1, a2, margin=None):
    """Assert that two sequences match element by element.

    Args:
        eq: Assertion callable invoked as ``eq(x, y)`` for every pair of
            corresponding elements, e.g. ``self.assertEqual`` or
            ``self.assertAlmostEqual``.
        a1: First iterable of values.
        a2: Second iterable of values.
        margin: Optional absolute tolerance. When given, it is forwarded to
            ``eq`` as the ``delta`` keyword, so ``eq`` must accept ``delta``
            (``unittest.TestCase.assertAlmostEqual`` does).

    Raises:
        AssertionError: If the two inputs do not have the same number of
            elements. Anything raised by ``eq`` propagates unchanged.
    """
    left, right = list(a1), list(a2)

    # zip() stops at the shorter input, so without this check a missing or
    # extra trailing element would silently count as "equal".
    if len(left) != len(right):
        raise AssertionError(
            f"Sequences differ in length: {len(left)} != {len(right)}"
        )

    # The third positional parameter of assertAlmostEqual is ``places`` (a
    # digit count) and that of assertEqual is ``msg``; a tolerance therefore
    # has to be passed by keyword to be interpreted as a tolerance.
    extra = {} if margin is None else {"delta": margin}
    for x, y in zip(left, right):
        eq(x, y, **extra)
|
|
|
|
|
|
class TestGymCheckEnv(unittest.TestCase):
    """Round-trip tests for the space (de)serialization helpers.

    Every test converts a space to a dict with ``gym_space_to_dict`` (or
    ``space_to_dict``), rebuilds it with the matching ``*_from_dict``
    function, and compares the rebuilt space against the original.
    """

    def _make_cartpole(self):
        """Create a CartPole-v0 env that is closed when the test finishes."""
        env = gym.make("CartPole-v0")
        # Register the cleanup right away so the env is released even when
        # an assertion later in the test fails.
        self.addCleanup(env.close)
        return env

    def _assert_box_equal(self, actual, expected):
        """Assert that two Box spaces agree on bounds, shape and dtype."""
        _assert_array_equal(
            self.assertAlmostEqual, actual.low.tolist(), expected.low.tolist(), 0.001
        )
        _assert_array_equal(
            self.assertAlmostEqual,
            actual.high.tolist(),
            expected.high.tolist(),
            0.001,
        )
        _assert_array_equal(self.assertEqual, actual.shape, expected.shape)
        self.assertEqual(actual.dtype, expected.dtype)

    def test_box_space(self):
        """A Box space keeps its bounds, shape and dtype."""
        obs_space = self._make_cartpole().observation_space

        d = gym_space_to_dict(obs_space)
        sp = gym_space_from_dict(d)

        self._assert_box_equal(sp, obs_space)

    def test_discrete_space(self):
        """A Discrete space keeps its number of actions."""
        action_space = self._make_cartpole().action_space

        d = gym_space_to_dict(action_space)
        sp = gym_space_from_dict(d)

        self.assertEqual(sp.n, action_space.n)

    def test_multi_discrete_space(self):
        """A MultiDiscrete space keeps ``nvec`` and dtype."""
        md_space = gym.spaces.MultiDiscrete(nvec=np.array([3, 4, 5]))

        d = gym_space_to_dict(md_space)
        sp = gym_space_from_dict(d)

        _assert_array_equal(self.assertAlmostEqual, sp.nvec, md_space.nvec, 0.001)
        self.assertEqual(md_space.dtype, sp.dtype)

    def test_tuple_space(self):
        """A Tuple space keeps its Box and Discrete children."""
        env = self._make_cartpole()
        space = gym.spaces.Tuple(spaces=[env.observation_space, env.action_space])

        d = gym_space_to_dict(space)
        sp = gym_space_from_dict(d)

        self._assert_box_equal(sp.spaces[0], space.spaces[0])
        self.assertEqual(sp.dtype, space.dtype)

        self.assertEqual(sp.spaces[1].n, space.spaces[1].n)

    def test_dict_space(self):
        """A Dict space keeps its Box and Discrete children."""
        env = self._make_cartpole()
        space = gym.spaces.Dict(
            spaces={"obs": env.observation_space, "action": env.action_space}
        )

        d = gym_space_to_dict(space)
        sp = gym_space_from_dict(d)

        self._assert_box_equal(sp.spaces["obs"], space.spaces["obs"])
        self.assertEqual(sp.dtype, space.dtype)

        self.assertEqual(sp.spaces["action"].n, space.spaces["action"].n)

    def test_simplex_space(self):
        """A Simplex space keeps its shape, concentration and dtype."""
        space = Simplex(shape=(3, 4), concentration=np.array((1, 2, 1)))

        d = gym_space_to_dict(space)
        sp = gym_space_from_dict(d)

        _assert_array_equal(self.assertEqual, space.shape, sp.shape)
        _assert_array_equal(
            self.assertAlmostEqual, space.concentration, sp.concentration
        )
        self.assertEqual(space.dtype, sp.dtype)

    def test_repeated(self):
        """A Repeated space keeps its child type, ``max_len`` and dtype."""
        space = Repeated(gym.spaces.Box(low=-1, high=1, shape=(1, 200)), max_len=8)

        d = gym_space_to_dict(space)
        sp = gym_space_from_dict(d)

        self.assertIsInstance(sp.child_space, gym.spaces.Box)
        self.assertEqual(space.max_len, sp.max_len)
        self.assertEqual(space.dtype, sp.dtype)

    def test_flex_dict(self):
        """A FlexDict keeps the type of each of its entries."""
        space = FlexDict({})
        space["box"] = gym.spaces.Box(low=-1, high=1, shape=(1, 200))
        space["discrete"] = gym.spaces.Discrete(2)
        space["tuple"] = gym.spaces.Tuple(
            (gym.spaces.Box(low=-1, high=1, shape=(1, 200)), gym.spaces.Discrete(2))
        )

        d = gym_space_to_dict(space)
        sp = gym_space_from_dict(d)

        self.assertIsInstance(sp["box"], gym.spaces.Box)
        self.assertIsInstance(sp["discrete"], gym.spaces.Discrete)
        self.assertIsInstance(sp["tuple"], gym.spaces.Tuple)

    def test_original_space(self):
        """The ``original_space`` attribute survives ``space_to_dict``."""
        space = gym.spaces.Box(low=0.0, high=1.0, shape=(10,))
        space.original_space = gym.spaces.Dict(
            {
                "obs1": gym.spaces.Box(low=0.0, high=1.0, shape=(3,)),
                "obs2": gym.spaces.Box(low=0.0, high=1.0, shape=(7,)),
            }
        )

        d = space_to_dict(space)
        sp = space_from_dict(d)

        self.assertIsInstance(sp, gym.spaces.Box)
        self.assertIsInstance(sp.original_space, gym.spaces.Dict)
        self.assertIsInstance(sp.original_space["obs1"], gym.spaces.Box)
        self.assertIsInstance(sp.original_space["obs2"], gym.spaces.Box)
|
|
|
|
|
|
if __name__ == "__main__":
    # When executed directly, run this file through pytest in verbose mode
    # and use pytest's result as the process exit status.
    import sys

    import pytest

    exit_code = pytest.main(["-v", __file__])
    sys.exit(exit_code)
|