diff --git a/mujoco_maze/maze_task.py b/mujoco_maze/maze_task.py index 7c19e98..9d36a1e 100644 --- a/mujoco_maze/maze_task.py +++ b/mujoco_maze/maze_task.py @@ -249,7 +249,7 @@ class GoalRewardTRoom(MazeTask): def __init__( self, scale: float, - goals: List[Tuple[float, float]] = [(2.0, -4.0)], + goals: List[Tuple[float, float]] = [(2.0, -3.0)], ) -> None: super().__init__(scale) self.goals = [] @@ -267,7 +267,6 @@ class GoalRewardTRoom(MazeTask): E, B, R = MazeCell.EMPTY, MazeCell.BLOCK, MazeCell.ROBOT return [ [B, B, B, B, B, B, B], - [B, E, E, E, E, E, B], [B, E, E, B, E, E, B], [B, E, E, B, E, E, B], [B, E, B, B, B, E, B], diff --git a/tests/test_envs.py b/tests/test_envs.py index 76e8190..6e925a1 100644 --- a/tests/test_envs.py +++ b/tests/test_envs.py @@ -28,7 +28,7 @@ def test_point_maze(maze_id): @pytest.mark.parametrize("v", [0, 1]) def test_maze_args(v): - env = gym.make(f"PointTRoom-v{v}", task_kwargs={"goals": [(-2.0, -4.0)]}) + env = gym.make(f"PointTRoom-v{v}", task_kwargs={"goals": [(-2.0, -3.0)]}) assert env.reset().shape == (7,) s, _, _, _ = env.step(env.action_space.sample()) assert s.shape == (7,)