Add manuall collision detection for billiard

2020-09-28 20:05:08 +09:00 · 2020-09-28 20:05:08 +09:00 · 615ba45dde
commit 615ba45dde
parent 8c7c18854b
4 changed files with 35 additions and 17 deletions
--- a/mujoco_maze/init.py
+++ b/mujoco_maze/init.py
@ -29,7 +29,7 @@ for maze_id in TaskRegistry.keys():
            max_episode_steps=1000,
            reward_threshold=task_cls.REWARD_THRESHOLD,
        )
-        if "Rolling" in maze_id:
+        if "Billiard" in maze_id:
            continue
        # Ant
        gym.envs.register(
--- a/mujoco_maze/maze_env.py
+++ b/mujoco_maze/maze_env.py
@ -72,6 +72,9 @@ class MazeEnv(gym.Env):
            self._collision = maze_env_utils.CollisionDetector(
                structure, size_scaling, torso_x, torso_y, model_cls.RADIUS,
            )
+            self._objball_collision = maze_env_utils.CollisionDetector(
+                structure, size_scaling, torso_x, torso_y, 0.8,
+            )
        else:
            self._collision = None

@ -360,12 +363,19 @@ class MazeEnv(gym.Env):
                coords.append((j * size_scaling, i * size_scaling))
        return coords

-    def step(self, action) -> Tuple[np.ndarray, float, bool, dict]:
+    def _objball_positions(self) -> None:
+        return [
+            self.wrapped_env.get_body_com(name)[:2].copy() for name in self.object_balls
+        ]
+
+    def step(self, action: np.ndarray) -> Tuple[np.ndarray, float, bool, dict]:
        self.t += 1
        if self.wrapped_env.MANUAL_COLLISION:
            old_pos = self.wrapped_env.get_xy()
+            old_objballs = self._objball_positions()
            inner_next_obs, inner_reward, _, info = self.wrapped_env.step(action)
            new_pos = self.wrapped_env.get_xy()
+            new_objballs = self._objball_positions()
            # Checks that the new_position is in the wall
            collision = self._collision.detect(old_pos, new_pos)
            if collision is not None:
@ -375,6 +385,14 @@ class MazeEnv(gym.Env):
                    self.wrapped_env.set_xy(old_pos)
                else:
                    self.wrapped_env.set_xy(pos)
+            for name, old, new in zip(self.object_balls, old_objballs, new_objballs):
+                collision = self._objball_collision.detect(old, new)
+                if collision is not None:
+                    pos = collision.point + self._restitution_coef * collision.rest()
+                    if self._objball_collision.detect(old, pos) is not None:
+                        pos = old
+                    idx = self.wrapped_env.model.body_name2id(name)
+                    self.wrapped_env.data.xipos[idx][:2] = pos
        else:
            inner_next_obs, inner_reward, _, info = self.wrapped_env.step(action)
        next_obs = self._get_obs()
@ -394,19 +412,19 @@ def _add_object_ball(worldbody: ET.Element, i: str, j: str, x: float, y: float)
        body,
        "geom",
        type="sphere",
-        name=f"objball_geom_{i}_{j}",
-        size="1",
-        pos="0.0 0.0 0.5",
+        name=f"objball_{i}_{j}_geom",
+        size="1.0",  # Radius
+        pos="0.0 0.0 1.0",  # Z = 1.0 so that this ball can move!!
        rgba="0.1 0.1 0.7 1",
        contype="1",
        conaffinity="1",
-        mass="0.00004",
-        solimp="0.9 0.99 0.001"
+        solimp="0.9 0.99 0.001",
+        mass="0.0001",
    )
    ET.SubElement(
        body,
        "joint",
-        name=f"objball_x_{i}_{j}",
+        name=f"objball_{i}_{j}_x",
        axis="1 0 0",
        pos="0 0 0.0",
        type="slide",
@ -414,7 +432,7 @@ def _add_object_ball(worldbody: ET.Element, i: str, j: str, x: float, y: float)
    ET.SubElement(
        body,
        "joint",
-        name=f"objball_y_{i}_{j}",
+        name=f"objball_{i}_{j}_y",
        axis="0 1 0",
        pos="0 0 0",
        type="slide",
@ -422,7 +440,7 @@ def _add_object_ball(worldbody: ET.Element, i: str, j: str, x: float, y: float)
    ET.SubElement(
        body,
        "joint",
-        name=f"objball_rot_{i}_{j}",
+        name=f"objball_{i}_{j}_rot",
        axis="0 0 1",
        pos="0 0 0",
        type="hinge",
--- a/mujoco_maze/maze_task.py
+++ b/mujoco_maze/maze_task.py
@ -27,7 +27,7 @@ class MazeGoal:
        reward_scale: float = 1.0,
        rgb: Rgb = RED,
        threshold: float = 0.6,
-        custom_size: Optional[float] = None
+        custom_size: Optional[float] = None,
    ) -> None:
        assert 0.0 <= reward_scale <= 1.0
        self.pos = pos
@ -330,7 +330,7 @@ class DistRewardBlockMaze(GoalRewardBlockMaze, DistRewardMixIn):
    pass


-class GoalRewardRolling(MazeTask):
+class GoalRewardBilliard(MazeTask):
    REWARD_THRESHOLD: float = 0.9
    PENALTY: float = -0.0001
    MAZE_SIZE_SCALING: Scaling = Scaling(4.0, 3.0, 3.0)
@ -360,7 +360,7 @@ class GoalRewardRolling(MazeTask):
        ]


-class DistRewardRolling(GoalRewardRolling):
+class DistRewardBilliard(GoalRewardBilliard):
    def reward(self, obs: np.ndarray) -> float:
        return -self.goals[0].euc_dist(obs[3:6]) / self.scale

@ -375,7 +375,7 @@ class TaskRegistry:
        "4Rooms": [DistReward4Rooms, GoalReward4Rooms, SubGoal4Rooms],
        "TRoom": [DistRewardTRoom, GoalRewardTRoom],
        "BlockMaze": [DistRewardBlockMaze, GoalRewardBlockMaze],
-        "Rolling": [DistRewardRolling, GoalRewardRolling],
+        "Billiard": [DistRewardBilliard, GoalRewardBilliard],
    }

    @staticmethod
--- a/tests/test_envs.py
+++ b/tests/test_envs.py
@ -6,7 +6,7 @@ import mujoco_maze

@pytest.mark.parametrize("maze_id", mujoco_maze.TaskRegistry.keys())
 def test_ant_maze(maze_id):
-    if "Rolling" in maze_id:
+    if "Billiard" in maze_id:
        return
    for i in range(2):
        env = gym.make(f"Ant{maze_id}-v{i}")
@ -38,7 +38,7 @@ def test_point_maze(maze_id):

@pytest.mark.parametrize("maze_id", mujoco_maze.TaskRegistry.keys())
 def test_reacher_maze(maze_id):
-    for inhibited in ["Fall", "Push", "Block", "Rolling"]:
+    for inhibited in ["Fall", "Push", "Block", "Billiard"]:
        if inhibited in maze_id:
            return
    for i in range(2):
@ -52,7 +52,7 @@ def test_reacher_maze(maze_id):

@pytest.mark.parametrize("maze_id", mujoco_maze.TaskRegistry.keys())
 def test_swimmer_maze(maze_id):
-    for inhibited in ["Fall", "Push", "Block", "Rolling"]:
+    for inhibited in ["Fall", "Push", "Block", "Billiard"]:
        if inhibited in maze_id:
            return
    for i in range(2):