diff --git a/mujoco_maze/maze_task.py b/mujoco_maze/maze_task.py index 9d36a1e..52afbbe 100644 --- a/mujoco_maze/maze_task.py +++ b/mujoco_maze/maze_task.py @@ -249,7 +249,7 @@ class GoalRewardTRoom(MazeTask): def __init__( self, scale: float, - goals: List[Tuple[float, float]] = [(2.0, -3.0)], + goals: List[Tuple[float, float]] = [(2.0, -4.0)], ) -> None: super().__init__(scale) self.goals = [] @@ -270,6 +270,7 @@ class GoalRewardTRoom(MazeTask): [B, E, E, B, E, E, B], [B, E, E, B, E, E, B], [B, E, B, B, B, E, B], + [B, E, E, E, E, E, B], [B, E, E, R, E, E, B], [B, B, B, B, B, B, B], ] diff --git a/tests/test_envs.py b/tests/test_envs.py index 6e925a1..76e8190 100644 --- a/tests/test_envs.py +++ b/tests/test_envs.py @@ -28,7 +28,7 @@ def test_point_maze(maze_id): @pytest.mark.parametrize("v", [0, 1]) def test_maze_args(v): - env = gym.make(f"PointTRoom-v{v}", task_kwargs={"goals": [(-2.0, -3.0)]}) + env = gym.make(f"PointTRoom-v{v}", task_kwargs={"goals": [(-2.0, -4.0)]}) assert env.reset().shape == (7,) s, _, _, _ = env.step(env.action_space.sample()) assert s.shape == (7,)