From d6a96021d242bd72194a139bf9715d37aeb28a0a Mon Sep 17 00:00:00 2001 From: kngwyu Date: Wed, 30 Sep 2020 13:39:32 +0900 Subject: [PATCH] Renew Subgoal Billiard --- mujoco_maze/maze_task.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/mujoco_maze/maze_task.py b/mujoco_maze/maze_task.py index 065ad95..fc8d993 100644 --- a/mujoco_maze/maze_task.py +++ b/mujoco_maze/maze_task.py @@ -388,8 +388,8 @@ class SubGoalBilliard(GoalRewardBilliard): def __init__( self, scale: float, - primary_goal: Tuple[float, float] = (2.0, -3.0), - subgoal: Tuple[float, float] = (-2.0, -3.0), + primary_goal: Tuple[float, float] = (4.0, -3.0), + subgoal: Tuple[float, float] = (4.0, 1.0), ) -> None: super().__init__(scale, primary_goal) self.goals.append( @@ -408,10 +408,11 @@ class SubGoalBilliard(GoalRewardBilliard): R, M = MazeCell.ROBOT, MazeCell.OBJECT_BALL return [ [B, B, B, B, B, B, B], + [B, E, E, B, B, E, B], [B, E, E, E, E, E, B], [B, E, E, E, B, B, B], - [B, E, E, M, E, E, B], - [B, E, E, R, E, E, B], + [B, R, M, E, E, E, B], + [B, E, E, E, E, E, B], [B, B, B, B, B, B, B], ]