Fix table tennis (tt) issues: observation context and trajectory length

2022-02-08 09:50:01 +01:00 · 2022-02-08 09:50:01 +01:00 · 2a27f59e50
commit 2a27f59e50
parent 66be0b1e02
6 changed files with 58 additions and 15 deletions
--- a/alr_envs/alr/init.py
+++ b/alr_envs/alr/init.py
@ -236,6 +236,17 @@ register(
        }
    )
 # Beerpong devel big table
 register(
        id='ALRBeerPong-v3',
        entry_point='alr_envs.alr.mujoco:ALRBeerBongEnv',
        max_episode_steps=600,
        kwargs={
            "rndm_goal": True,
            "cup_goal_pos": [-0.3, -1.2]
        }
    )
 # Motion Primitive Environments
 ## Simple Reacher
@ -402,6 +413,32 @@ for _v in _versions:
    )
    ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)
 ## Beerpong- Big table devel
 register(
        id='BeerpongProMP-v3',
        entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',
        kwargs={
            "name": f"alr_envs:ALRBeerPong-v3",
            "wrappers": [mujoco.beerpong.MPWrapper],
            "mp_kwargs": {
                "num_dof": 7,
                "num_basis": 5,
                "duration": 1,
                "post_traj_time": 2,
                "policy_type": "motor",
                "weights_scale": 1,
                "zero_start": True,
                "zero_goal": False,
                "policy_kwargs": {
                    "p_gains": np.array([       1.5,   5,   2.55,    3,   2.,    2,   1.25]),
                    "d_gains": np.array([0.02333333, 0.1, 0.0625, 0.08, 0.03, 0.03, 0.0125])
                }
            }
        }
    )
 ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append('BeerpongProMP-v3')
 ## Table Tennis
 ctxt_dim = [2, 4]
 for _v, cd in enumerate(ctxt_dim):
@ -416,7 +453,7 @@ for _v, cd in enumerate(ctxt_dim):
                "num_dof": 7,
                "num_basis": 2,
                "duration": 1.25,
-                "post_traj_time": 4.5,
+                "post_traj_time": 1.5,
                "policy_type": "motor",
                "weights_scale": 1.0,
                "zero_start": True,
--- a/alr_envs/alr/mujoco/beerpong/assets/beerpong_wo_cup.xml
+++ b/alr_envs/alr/mujoco/beerpong/assets/beerpong_wo_cup.xml
@ -132,18 +132,19 @@
                </body>
            </body>
        </body>
-        <body name="table_body" pos="0 -1.85 0.4025">
+         <body name="table_body" pos="0 -2.8 0.4025">
-            <geom name="table" type="box" size="0.4 0.6 0.4" rgba="0.8 0.655 0.45 1" solimp="0.999 0.999 0.001"
+            <geom name="table" type="box" size="1.5 1.5 0.4" rgba="0.8 0.655 0.45 1" solimp="0.999 0.999 0.001"
                  solref="-10000 -100"/>
-            <geom name="table_contact_geom" type="box" size="0.4 0.6 0.1" pos="0 0 0.31" rgba="1.4 0.8 0.45 1" solimp="0.999 0.999 0.001"
+            <geom name="table_contact_geom" type="box" size="1.5 1.5 0.1" pos="0 0 0.31" rgba="1.4 0.8 0.45 1" solimp="0.999 0.999 0.001"
                  solref="-10000 -100"/>
        </body>
        <geom name="table_robot" type="box" size="0.1 0.1 0.3" pos="0 0.00 0.3025" rgba="0.8 0.655 0.45 1" solimp="0.999 0.999 0.001"
                  solref="-10000 -100"/>
-        <geom name="wall" type="box" quat="1 0 0 0" size="0.4 0.04 1.1" pos="0. -2.45 1.1" rgba="0.8 0.655 0.45 1" solimp="0.999 0.999 0.001"
+        <geom name="wall" type="box" quat="1 0 0 0" size="1.5 0.04 1.4" pos="0. -4.3 1.4" rgba="0.8 0.655 0.45 1" solimp="0.999 0.999 0.001"
                  solref="-10000 -100"/>
-        <body name="cup_table" pos="0.32 -1.55 0.84" quat="0.7071068 0.7071068 0 0">
+<!--        <body name="cup_table" pos="0.32 -1.55 0.84" quat="0.7071068 0.7071068 0 0">-->
        <body name="cup_table" pos="1.42 -1.25 0.84" quat="0.7071068 0.7071068 0 0">
            <inertial pos="-3.75236e-10 8.27811e-05 0.0947015" quat="0.999945 -0.0104888 0 0" mass="10.132" diaginertia="0.000285643 0.000270485 9.65696e-05" />
            <geom priority= "1" name="cup_geom_table3" pos="0 0.1 0.001" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup3_table" mass="10"/>
            <geom priority= "1" name="cup_geom_table4" pos="0 0.1 0.001" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup4_table" mass="10"/>
--- a/alr_envs/alr/mujoco/beerpong/beerpong.py
+++ b/alr_envs/alr/mujoco/beerpong/beerpong.py
@ -7,8 +7,11 @@ from gym.envs.mujoco import MujocoEnv
 from alr_envs.alr.mujoco.beerpong.beerpong_reward_staged import BeerPongReward
-CUP_POS_MIN = np.array([-0.32, -2.2])
+# CUP_POS_MIN = np.array([-0.32, -2.2])
-CUP_POS_MAX = np.array([0.32, -1.2])
+# CUP_POS_MAX = np.array([0.32, -1.2])
 CUP_POS_MIN = np.array([-1.42, -4.05])
 CUP_POS_MAX = np.array([1.42, -1.25])
 class ALRBeerBongEnv(MujocoEnv, utils.EzPickle):
--- a/alr_envs/alr/mujoco/table_tennis/mp_wrapper.py
+++ b/alr_envs/alr/mujoco/table_tennis/mp_wrapper.py
@ -11,9 +11,9 @@ class MPWrapper(MPEnvWrapper):
    def active_obs(self):
        # TODO: @Max Filter observations correctly
        return np.hstack([
-            [True] * 7,  # Joint Pos
+            [False] * 7,  # Joint Pos
-            [True] * 3, # Ball pos
+            [True] * 2, # Ball pos
-            [True] * 3  # goal pos
+            [True] * 2  # goal pos
        ])
    @property
--- a/alr_envs/alr/mujoco/table_tennis/tt_gym.py
+++ b/alr_envs/alr/mujoco/table_tennis/tt_gym.py
@ -10,7 +10,8 @@ from alr_envs.alr.mujoco.table_tennis.tt_reward import TT_Reward
 #TODO: Check for simulation stability. Make sure the code runs even for sim crash
-MAX_EPISODE_STEPS = 1750
+# MAX_EPISODE_STEPS = 1750
 MAX_EPISODE_STEPS = 1375
 BALL_NAME_CONTACT = "target_ball_contact"
 BALL_NAME = "target_ball"
 TABLE_NAME = 'table_tennis_table'
@ -76,10 +77,11 @@ class TTEnvGym(MujocoEnv, utils.EzPickle):
        self._ids_set = True
    def _get_obs(self):
-        ball_pos = self.sim.data.body_xpos[self.ball_id]
+        ball_pos = self.sim.data.body_xpos[self.ball_id][:2].copy()
        goal_pos = self.goal[:2].copy()
        obs = np.concatenate([self.sim.data.qpos[:7].copy(),  # 7 joint positions
                              ball_pos,
-                              self.goal.copy()])
+                              goal_pos])
        return obs
    def sample_context(self):
--- a/setup.py
+++ b/setup.py
@ -7,7 +7,7 @@ setup(
    install_requires=[
        'gym',
        'PyQt5',
-        'matplotlib',
+        #'matplotlib',
        #'mp_env_api @ git+https://github.com/ALRhub/motion_primitive_env_api.git',
 #         'mp_env_api @ git+ssh://git@github.com/ALRhub/motion_primitive_env_api.git',
        'mujoco-py<2.1,>=2.0',