support for contexts, policy classes, pd controller example, breaking changes etc

2021-02-11 10:49:57 +01:00 · 2021-02-11 10:49:57 +01:00 · c81378b9e7
commit c81378b9e7
parent 07195fa2dc
9 changed files with 807 additions and 262 deletions
--- a/alr_envs/mujoco/alr_mujoco_env.py
+++ b/alr_envs/mujoco/alr_mujoco_env.py
@ -0,0 +1,247 @@
 from collections import OrderedDict
 import os
 from gym import error, spaces
 from gym.utils import seeding
 import numpy as np
 from os import path
 import gym
 try:
    import mujoco_py
 except ImportError as e:
    raise error.DependencyNotInstalled("{}. (HINT: you need to install mujoco_py, and also perform the setup instructions here: https://github.com/openai/mujoco-py/.)".format(e))
 DEFAULT_SIZE = 500
 def convert_observation_to_space(observation):
    if isinstance(observation, dict):
        space = spaces.Dict(OrderedDict([
            (key, convert_observation_to_space(value))
            for key, value in observation.items()
        ]))
    elif isinstance(observation, np.ndarray):
        low = np.full(observation.shape, -float('inf'), dtype=np.float32)
        high = np.full(observation.shape, float('inf'), dtype=np.float32)
        space = spaces.Box(low, high, dtype=observation.dtype)
    else:
        raise NotImplementedError(type(observation), observation)
    return space
 class AlrMujocoEnv(gym.Env):
    """
    Superclass for all MuJoCo environments.
    """
    def __init__(self, model_path, n_substeps, apply_gravity_comp=True):
        """
        Args:
            model_path: path to xml file
            n_substeps: how many steps mujoco does per call to env.step
            use_servo: use actuator defined in xml, use False for direct torque control
        """
        if model_path.startswith("/"):
            fullpath = model_path
        else:
            fullpath = os.path.join(os.path.dirname(__file__), "assets", model_path)
        if not path.exists(fullpath):
            raise IOError("File %s does not exist" % fullpath)
        self.n_substeps = n_substeps
        self.apply_gravity_comp = apply_gravity_comp
        self.model = mujoco_py.load_model_from_path(fullpath)
        self.sim = mujoco_py.MjSim(self.model, nsubsteps=n_substeps)
        self.data = self.sim.data
        self.viewer = None
        self._viewers = {}
        self.metadata = {
            'render.modes': ['human', 'rgb_array', 'depth_array'],
            'video.frames_per_second': int(np.round(1.0 / self.dt))
        }
        self.init_qpos = self.sim.data.qpos.ravel().copy()
        self.init_qvel = self.sim.data.qvel.ravel().copy()
        self._set_action_space()
        # action = self.action_space.sample()
        # observation, _reward, done, _info = self.step(action)
        # assert not done
        observation = self.reset()
        self._set_observation_space(observation)
        self.seed()
    @property
    def current_pos(self):
        """
        By default returns the joint positions of all simulated objects. May be overriden in subclass.
        """
        return self.sim.data.qpos
    @property
    def current_vel(self):
        """
        By default returns the joint velocities of all simulated objects. May be overriden in subclass.
        """
        return self.sim.data.qvel
    def extend_des_pos(self, des_pos):
        """
        In a simplified environment, the actions may only control a subset of all the joints.
        Extend the trajectory to match the environments full action space
        Args:
            des_pos:
        Returns:
        """
        pass
    def extend_des_vel(self, des_vel):
        pass
    def _set_action_space(self):
        bounds = self.model.actuator_ctrlrange.copy().astype(np.float32)
        low, high = bounds.T
        self.action_space = spaces.Box(low=low, high=high, dtype=np.float32)
        return self.action_space
    def _set_observation_space(self, observation):
        self.observation_space = convert_observation_to_space(observation)
        return self.observation_space
    def seed(self, seed=None):
        self.np_random, seed = seeding.np_random(seed)
        return [seed]
    # methods to override:
    # ----------------------------
    def configure(self, *args, **kwargs):
        """
        Helper method to set certain environment properties such as contexts in contextual environments since reset()
        doesn't take arguments. Should be called before/after reset(). TODO: before or after?
        """
        pass
    def reset_model(self):
        """
        Reset the robot degrees of freedom (qpos and qvel).
        Implement this in each subclass.
        """
        raise NotImplementedError
    def viewer_setup(self):
        """
        This method is called when the viewer is initialized.
        Optionally implement this method, if you need to tinker with camera position
        and so forth.
        """
        pass
    # -----------------------------
    def reset(self):
        self.sim.reset()
        ob = self.reset_model()
        return ob
    def set_state(self, qpos, qvel):
        assert qpos.shape == (self.model.nq,) and qvel.shape == (self.model.nv,)
        old_state = self.sim.get_state()
        new_state = mujoco_py.MjSimState(old_state.time, qpos, qvel,
                                         old_state.act, old_state.udd_state)
        self.sim.set_state(new_state)
        self.sim.forward()
    @property
    def dt(self):
        return self.model.opt.timestep * self.n_substeps
    def do_simulation(self, ctrl):
        """
        Additionally returns whether there was an error while stepping the simulation
        """
        error_in_sim = False
        num_actuations = len(ctrl)
        if self.apply_gravity_comp:
            self.sim.data.ctrl[:num_actuations] = ctrl + self.sim.data.qfrc_bias[:num_actuations].copy() / self.model.actuator_gear[:, 0]
        else:
            self.sim.data.ctrl[:num_actuations] = ctrl
        try:
            self.sim.step()
        except mujoco_py.builder.MujocoException as e:
            error_in_sim = True
        return error_in_sim
    def render(self,
               mode='human',
               width=DEFAULT_SIZE,
               height=DEFAULT_SIZE,
               camera_id=None,
               camera_name=None):
        if mode == 'rgb_array' or mode == 'depth_array':
            if camera_id is not None and camera_name is not None:
                raise ValueError("Both `camera_id` and `camera_name` cannot be"
                                 " specified at the same time.")
            no_camera_specified = camera_name is None and camera_id is None
            if no_camera_specified:
                camera_name = 'track'
            if camera_id is None and camera_name in self.model._camera_name2id:
                camera_id = self.model.camera_name2id(camera_name)
            self._get_viewer(mode).render(width, height, camera_id=camera_id)
        if mode == 'rgb_array':
            # window size used for old mujoco-py:
            data = self._get_viewer(mode).read_pixels(width, height, depth=False)
            # original image is upside-down, so flip it
            return data[::-1, :, :]
        elif mode == 'depth_array':
            self._get_viewer(mode).render(width, height)
            # window size used for old mujoco-py:
            # Extract depth part of the read_pixels() tuple
            data = self._get_viewer(mode).read_pixels(width, height, depth=True)[1]
            # original image is upside-down, so flip it
            return data[::-1, :]
        elif mode == 'human':
            self._get_viewer(mode).render()
    def close(self):
        if self.viewer is not None:
            # self.viewer.finish()
            self.viewer = None
            self._viewers = {}
    def _get_viewer(self, mode):
        self.viewer = self._viewers.get(mode)
        if self.viewer is None:
            if mode == 'human':
                self.viewer = mujoco_py.MjViewer(self.sim)
            elif mode == 'rgb_array' or mode == 'depth_array':
                self.viewer = mujoco_py.MjRenderContextOffscreen(self.sim, -1)
            self.viewer_setup()
            self._viewers[mode] = self.viewer
        return self.viewer
    def get_body_com(self, body_name):
        return self.data.get_body_xpos(body_name)
    def state_vector(self):
        return np.concatenate([
            self.sim.data.qpos.flat,
            self.sim.data.qvel.flat
        ])
--- a/alr_envs/mujoco/alr_reward_fct.py
+++ b/alr_envs/mujoco/alr_reward_fct.py
@ -0,0 +1,21 @@
 class AlrReward:
    """
    A base class for non-Markovian reward functions which may need trajectory information to calculate an episodic
    reward. Call the methods in reset() and step() of the environment.
    """
    # methods to override:
    # ----------------------------
    def reset(self, *args, **kwargs):
        """
        Reset the reward function, empty state buffers before an episode, set contexts that influence reward, etc.
        """
        raise NotImplementedError
    def compute_reward(self, *args, **kwargs):
        """
        Returns: Useful things to return are reward values, success flags or crash flags
        """
        raise NotImplementedError
--- a/alr_envs/mujoco/ball_in_a_cup/assets/biac_base.xml
+++ b/alr_envs/mujoco/ball_in_a_cup/assets/biac_base.xml
@ -0,0 +1,360 @@
 <mujoco model="wam(v1.31)">
    <compiler angle="radian" meshdir="meshes/" />
    <option timestep="0.0005" integrator="Euler" />
    <size njmax="500" nconmax="100" />
    <default class="main">
        <joint limited="true" frictionloss="0.001" />
        <default class="viz">
            <geom type="mesh" contype="0" conaffinity="0" group="1" rgba="0.7 0.7 0.7 1" />
        </default>
        <default class="col">
            <geom type="mesh" contype="0" rgba="0.5 0.6 0.7 1" />
        </default>
    </default>
    <asset>
        <texture type="2d" name="groundplane" builtin="checker" mark="edge" rgb1="0.25 0.26 0.25" rgb2="0.22 0.22 0.22" markrgb="0.3 0.3 0.3" width="100" height="100" />
        <material name="MatGnd" texture="groundplane" texrepeat="5 5" specular="1" shininess="0.3" reflectance="1e-05" />
        <mesh name="base_link_fine" file="base_link_fine.stl" />
        <mesh name="base_link_convex" file="base_link_convex.stl" />
        <mesh name="shoulder_link_fine" file="shoulder_link_fine.stl" />
        <mesh name="shoulder_link_convex_decomposition_p1" file="shoulder_link_convex_decomposition_p1.stl" />
        <mesh name="shoulder_link_convex_decomposition_p2" file="shoulder_link_convex_decomposition_p2.stl" />
        <mesh name="shoulder_link_convex_decomposition_p3" file="shoulder_link_convex_decomposition_p3.stl" />
        <mesh name="shoulder_pitch_link_fine" file="shoulder_pitch_link_fine.stl" />
        <mesh name="shoulder_pitch_link_convex" file="shoulder_pitch_link_convex.stl" />
        <mesh name="upper_arm_link_fine" file="upper_arm_link_fine.stl" />
        <mesh name="upper_arm_link_convex_decomposition_p1" file="upper_arm_link_convex_decomposition_p1.stl" />
        <mesh name="upper_arm_link_convex_decomposition_p2" file="upper_arm_link_convex_decomposition_p2.stl" />
        <mesh name="elbow_link_fine" file="elbow_link_fine.stl" />
        <mesh name="elbow_link_convex" file="elbow_link_convex.stl" />
        <mesh name="forearm_link_fine" file="forearm_link_fine.stl" />
        <mesh name="forearm_link_convex_decomposition_p1" file="forearm_link_convex_decomposition_p1.stl" />
        <mesh name="forearm_link_convex_decomposition_p2" file="forearm_link_convex_decomposition_p2.stl" />
        <mesh name="wrist_yaw_link_fine" file="wrist_yaw_link_fine.stl" />
        <mesh name="wrist_yaw_link_convex_decomposition_p1" file="wrist_yaw_link_convex_decomposition_p1.stl" />
        <mesh name="wrist_yaw_link_convex_decomposition_p2" file="wrist_yaw_link_convex_decomposition_p2.stl" />
        <mesh name="wrist_pitch_link_fine" file="wrist_pitch_link_fine.stl" />
        <mesh name="wrist_pitch_link_convex_decomposition_p1" file="wrist_pitch_link_convex_decomposition_p1.stl" />
        <mesh name="wrist_pitch_link_convex_decomposition_p2" file="wrist_pitch_link_convex_decomposition_p2.stl" />
        <mesh name="wrist_pitch_link_convex_decomposition_p3" file="wrist_pitch_link_convex_decomposition_p3.stl" />
        <mesh name="wrist_palm_link_fine" file="wrist_palm_link_fine.stl" />
        <mesh name="wrist_palm_link_convex" file="wrist_palm_link_convex.stl" />
        <mesh name="cup1" file="cup_split1.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup2" file="cup_split2.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup3" file="cup_split3.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup4" file="cup_split4.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup5" file="cup_split5.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup6" file="cup_split6.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup7" file="cup_split7.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup8" file="cup_split8.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup9" file="cup_split9.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup10" file="cup_split10.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup11" file="cup_split11.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup12" file="cup_split12.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup13" file="cup_split13.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup14" file="cup_split14.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup15" file="cup_split15.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup16" file="cup_split16.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup17" file="cup_split17.stl" scale="0.001 0.001 0.001" />
        <mesh name="cup18" file="cup_split18.stl" scale="0.001 0.001 0.001" />
    </asset>
    <worldbody>
        <geom name="ground" size="1.5 2 1" type="plane" material="MatGnd" />
        <light pos="0.1 0.2 1.3" dir="-0.0758098 -0.32162 -0.985527" directional="true" cutoff="60" exponent="1" diffuse="1 1 1" specular="0.1 0.1 0.1" />
        <body name="wam/base_link" pos="0 0 0.6">
            <inertial pos="6.93764e-06 0.0542887 0.076438" quat="0.496481 0.503509 -0.503703 0.496255" mass="27.5544" diaginertia="0.432537 0.318732 0.219528" />
            <geom class="viz" quat="0.707107 0 0 -0.707107" mesh="base_link_fine" />
            <geom class="col" quat="0.707107 0 0 -0.707107" mesh="base_link_convex" />
            <body name="wam/shoulder_yaw_link" pos="0 0 0.16" quat="0.707107 0 0 -0.707107">
                <inertial pos="-0.00443422 -0.00066489 -0.12189" quat="0.999995 0.000984795 0.00270132 0.00136071" mass="10.7677" diaginertia="0.507411 0.462983 0.113271" />
                <joint name="wam/base_yaw_joint" pos="0 0 0" axis="0 0 1" range="-2.6 2.6" />
                <geom class="viz" pos="0 0 0.186" mesh="shoulder_link_fine" />
                <geom class="col" pos="0 0 0.186" mesh="shoulder_link_convex_decomposition_p1" />
                <geom class="col" pos="0 0 0.186" mesh="shoulder_link_convex_decomposition_p2" />
                <geom class="col" pos="0 0 0.186" mesh="shoulder_link_convex_decomposition_p3" />
                <body name="wam/shoulder_pitch_link" pos="0 0 0.184" quat="0.707107 -0.707107 0 0">
                    <inertial pos="-0.00236983 -0.0154211 0.0310561" quat="0.961781 -0.272983 0.0167269 0.0133385" mass="3.87494" diaginertia="0.0214207 0.0167101 0.0126465" />
                    <joint name="wam/shoulder_pitch_joint" pos="0 0 0" axis="0 0 1" range="-1.985 1.985" />
                    <geom class="viz" mesh="shoulder_pitch_link_fine" />
                    <geom class="col" mesh="shoulder_pitch_link_convex" />
                    <body name="wam/upper_arm_link" pos="0 -0.505 0" quat="0.707107 0.707107 0 0">
                        <inertial pos="-0.0382586 3.309e-05 -0.207508" quat="0.705455 0.0381914 0.0383402 0.706686" mass="1.80228" diaginertia="0.0665697 0.0634285 0.00622701" />
                        <joint name="wam/shoulder_yaw_joint" pos="0 0 0" axis="0 0 1" range="-2.8 2.8" />
                        <geom class="viz" pos="0 0 -0.505" mesh="upper_arm_link_fine" />
                        <geom class="col" pos="0 0 -0.505" mesh="upper_arm_link_convex_decomposition_p1" />
                        <geom class="col" pos="0 0 -0.505" mesh="upper_arm_link_convex_decomposition_p2" />
                        <body name="wam/forearm_link" pos="0.045 0 0.045" quat="0.707107 -0.707107 0 0">
                            <inertial pos="0.00498512 -0.132717 -0.00022942" quat="0.546303 0.447151 -0.548676 0.447842" mass="2.40017" diaginertia="0.0196896 0.0152225 0.00749914" />
                            <joint name="wam/elbow_pitch_joint" pos="0 0 0" axis="0 0 1" range="-0.9 3.14159" />
                            <geom class="viz" mesh="elbow_link_fine" />
                            <geom class="col" mesh="elbow_link_convex" />
                            <geom class="viz" pos="-0.045 -0.073 0" quat="0.707388 0.706825 0 0" mesh="forearm_link_fine" />
                            <geom class="col" pos="-0.045 -0.073 0" quat="0.707388 0.706825 0 0" mesh="forearm_link_convex_decomposition_p1" name="forearm_link_convex_decomposition_p1_geom" />
                            <geom class="col" pos="-0.045 -0.073 0" quat="0.707388 0.706825 0 0" mesh="forearm_link_convex_decomposition_p2" name="forearm_link_convex_decomposition_p2_geom" />
                            <body name="wam/wrist_yaw_link" pos="-0.045 0 0" quat="0.707107 0.707107 0 0">
                                <inertial pos="8.921e-05 0.00435824 -0.00511217" quat="0.708528 -0.000120667 0.000107481 0.705683" mass="0.12376" diaginertia="0.0112011 0.0111887 7.58188e-05" />
                                <joint name="wam/wrist_yaw_joint" pos="0 0 0" axis="0 0 1" range="-4.55 1.25" />
                                <geom class="viz" pos="0 0 0.3" mesh="wrist_yaw_link_fine" />
                                <geom class="col" pos="0 0 0.3" mesh="wrist_yaw_link_convex_decomposition_p1" name="wrist_yaw_link_convex_decomposition_p1_geom" />
                                <geom class="col" pos="0 0 0.3" mesh="wrist_yaw_link_convex_decomposition_p2" name="wrist_yaw_link_convex_decomposition_p2_geom" />
                                <body name="wam/wrist_pitch_link" pos="0 0 0.3" quat="0.707107 -0.707107 0 0">
                                    <inertial pos="-0.00012262 -0.0246834 -0.0170319" quat="0.994687 -0.102891 0.000824211 -0.00336105" mass="0.417974" diaginertia="0.000555166 0.000463174 0.00023407" />
                                    <joint name="wam/wrist_pitch_joint" pos="0 0 0" axis="0 0 1" range="-1.5707 1.5707" />
                                    <geom class="viz" mesh="wrist_pitch_link_fine" />
                                    <geom class="col" mesh="wrist_pitch_link_convex_decomposition_p1" name="wrist_pitch_link_convex_decomposition_p1_geom" />
                                    <geom class="col" mesh="wrist_pitch_link_convex_decomposition_p2" name="wrist_pitch_link_convex_decomposition_p2_geom" />
                                    <geom class="col" mesh="wrist_pitch_link_convex_decomposition_p3" name="wrist_pitch_link_convex_decomposition_p3_geom" />
                                    <body name="wam/wrist_palm_link" pos="0 -0.06 0" quat="0.707107 0.707107 0 0">
                                        <inertial pos="-7.974e-05 -0.00323552 -0.00016313" quat="0.594752 0.382453 0.382453 0.594752" mass="0.0686475" diaginertia="7.408e-05 3.81466e-05 3.76434e-05" />
                                        <joint name="wam/palm_yaw_joint" pos="0 0 0" axis="0 0 1" range="-2.7 2.7" />
                                        <geom class="viz" pos="0 0 -0.06" mesh="wrist_palm_link_fine" />
                                        <geom class="col" pos="0 0 -0.06" mesh="wrist_palm_link_convex" name="wrist_palm_link_convex_geom" />
                                        <body name="cup" pos="0 0 0" quat="-0.000203673 0 0 1">
                                            <inertial pos="-3.75236e-10 8.27811e-05 0.0947015" quat="0.999945 -0.0104888 0 0" mass="0.132" diaginertia="0.000285643 0.000270485 9.65696e-05" />
                                            <geom name="cup_geom1" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup1" />
                                            <geom name="cup_geom2" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup2" />
                                            <geom name="cup_geom3" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup3" />
                                            <geom name="cup_geom4" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup4" />
                                            <geom name="cup_geom5" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup5" />
                                            <geom name="cup_geom6" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup6" />
                                            <geom name="cup_geom7" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup7" />
                                            <geom name="cup_geom8" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup8" />
                                            <geom name="cup_geom9" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup9" />
                                            <geom name="cup_geom10" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup10" />
                                            <geom name="cup_base" pos="0 -0.035 0.1165" euler="-1.57 0 0" type="cylinder" size="0.038 0.0045" solref="-10000 -100"/>
 <!--                                            <geom name="cup_base_contact" pos="0 -0.025 0.1165" euler="-1.57 0 0" type="cylinder" size="0.03 0.0005" solref="-10000 -100" rgba="0 0 255 1"/>-->
                                            <geom name="cup_base_contact" pos="0 -0.005 0.1165" euler="-1.57 0 0" type="cylinder" size="0.02 0.0005" solref="-10000 -100" rgba="0 0 255 1"/>
 <!--                                            <geom name="cup_geom11" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup11" />-->
 <!--                                            <geom name="cup_geom12" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup12" />-->
 <!--                                            <geom name="cup_geom13" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup13" />-->
 <!--                                            <geom name="cup_geom14" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup14" />-->
                                            <geom name="cup_geom15" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup15" />
                                            <geom name="cup_geom16" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup16" />
                                            <geom name="cup_geom17" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup17" />
                                            <geom name="cup_geom18" pos="0 0.05 0.055" euler="-1.57 0 0" solref="-10000 -100" type="mesh" mesh="cup18" />
                                            <site name="cup_goal" pos="0 0.05 0.1165" rgba="255 0 0 1"/>
                                            <site name="cup_goal_final" pos="0 -0.025 0.1165" rgba="0 255 0 1"/>
                                            <body name="B0" pos="0 -0.045 0.1165" quat="0.707388 0 0 -0.706825">
                                                <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                <geom name="G0" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                <body name="B1" pos="0.0107 0 0">
                                                    <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                    <joint name="J0_1" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                    <joint name="J1_1" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                    <geom name="G1" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                    <body name="B2" pos="0.0107 0 0">
                                                        <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                        <joint name="J0_2" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                        <joint name="J1_2" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                        <geom name="G2" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                        <body name="B3" pos="0.0107 0 0">
                                                            <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                            <joint name="J0_3" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                            <joint name="J1_3" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                            <geom name="G3" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                            <body name="B4" pos="0.0107 0 0">
                                                                <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                <joint name="J0_4" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                <joint name="J1_4" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                <geom name="G4" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                <body name="B5" pos="0.0107 0 0">
                                                                    <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                    <joint name="J0_5" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                    <joint name="J1_5" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                    <geom name="G5" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                    <body name="B6" pos="0.0107 0 0">
                                                                        <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                        <joint name="J0_6" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                        <joint name="J1_6" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                        <geom name="G6" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                        <body name="B7" pos="0.0107 0 0">
                                                                            <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                            <joint name="J0_7" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                            <joint name="J1_7" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                            <geom name="G7" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                            <body name="B8" pos="0.0107 0 0">
                                                                                <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                <joint name="J0_8" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                <joint name="J1_8" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                <geom name="G8" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                <body name="B9" pos="0.0107 0 0">
                                                                                    <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                    <joint name="J0_9" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                    <joint name="J1_9" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                    <geom name="G9" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                    <body name="B10" pos="0.0107 0 0">
                                                                                        <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                        <joint name="J0_10" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                        <joint name="J1_10" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                        <geom name="G10" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                        <body name="B11" pos="0.0107 0 0">
                                                                                            <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                            <joint name="J0_11" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                            <joint name="J1_11" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                            <geom name="G11" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                            <body name="B12" pos="0.0107 0 0">
                                                                                                <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                <joint name="J0_12" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                <joint name="J1_12" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                <geom name="G12" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                <body name="B13" pos="0.0107 0 0">
                                                                                                    <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                    <joint name="J0_13" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                    <joint name="J1_13" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                    <geom name="G13" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                    <body name="B14" pos="0.0107 0 0">
                                                                                                        <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                        <joint name="J0_14" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                        <joint name="J1_14" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                        <geom name="G14" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                        <body name="B15" pos="0.0107 0 0">
                                                                                                            <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                            <joint name="J0_15" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                            <joint name="J1_15" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                            <geom name="G15" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                            <body name="B16" pos="0.0107 0 0">
                                                                                                                <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                <joint name="J0_16" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                <joint name="J1_16" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                <geom name="G16" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                <body name="B17" pos="0.0107 0 0">
                                                                                                                    <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                    <joint name="J0_17" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                    <joint name="J1_17" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                    <geom name="G17" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                    <body name="B18" pos="0.0107 0 0">
                                                                                                                        <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                        <joint name="J0_18" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                        <joint name="J1_18" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                        <geom name="G18" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                        <body name="B19" pos="0.0107 0 0">
                                                                                                                            <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                            <joint name="J0_19" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                            <joint name="J1_19" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                            <geom name="G19" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                            <body name="B20" pos="0.0107 0 0">
                                                                                                                                <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                                <joint name="J0_20" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                <joint name="J1_20" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                <geom name="G20" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                                <body name="B21" pos="0.0107 0 0">
                                                                                                                                    <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                                    <joint name="J0_21" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                    <joint name="J1_21" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                    <geom name="G21" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                                    <body name="B22" pos="0.0107 0 0">
                                                                                                                                        <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                                        <joint name="J0_22" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                        <joint name="J1_22" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                        <geom name="G22" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                                        <body name="B23" pos="0.0107 0 0">
                                                                                                                                            <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                                            <joint name="J0_23" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                            <joint name="J1_23" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                            <geom name="G23" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                                            <body name="B24" pos="0.0107 0 0">
                                                                                                                                                <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                                                <joint name="J0_24" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                <joint name="J1_24" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                <geom name="G24" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                                                <body name="B25" pos="0.0107 0 0">
                                                                                                                                                    <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                                                    <joint name="J0_25" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                    <joint name="J1_25" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                    <geom name="G25" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                                                    <body name="B26" pos="0.0107 0 0">
                                                                                                                                                        <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                                                        <joint name="J0_26" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                        <joint name="J1_26" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                        <geom name="G26" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                                                        <body name="B27" pos="0.0107 0 0">
                                                                                                                                                            <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                                                            <joint name="J0_27" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                            <joint name="J1_27" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                            <geom name="G27" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                                                            <body name="B28" pos="0.0107 0 0">
                                                                                                                                                                <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                                                                <joint name="J0_28" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                                <joint name="J1_28" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                                <geom name="G28" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                                                                <body name="B29" pos="0.0107 0 0">
                                                                                                                                                                    <inertial pos="0 0 0" quat="0.707107 0 0.707107 0" mass="7.4927e-05" diaginertia="5.87e-10 5.87e-10 3.74635e-11" />
                                                                                                                                                                    <joint name="J0_29" pos="-0.00535 0 0" axis="0 1 0" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                                    <joint name="J1_29" pos="-0.00535 0 0" axis="0 0 1" group="3" limited="false" damping="0.0001" frictionloss="0" />
                                                                                                                                                                    <geom name="G29" size="0.001 0.00427" quat="0.707107 0 0.707107 0" type="capsule" rgba="0.8 0.2 0.1 1" />
                                                                                                                                                                    <body name="ball">
                                                                                                                                                                        <geom name="ball_geom" type="sphere" size="0.02" mass="0.021" rgba="0.8 0.2 0.1 1"/>
                                                                                                                                                                    </body>
                                                                                                                                                                </body>
                                                                                                                                                            </body>
                                                                                                                                                        </body>
                                                                                                                                                    </body>
                                                                                                                                                </body>
                                                                                                                                            </body>
                                                                                                                                        </body>
                                                                                                                                    </body>
                                                                                                                                </body>
                                                                                                                            </body>
                                                                                                                        </body>
                                                                                                                    </body>
                                                                                                                </body>
                                                                                                            </body>
                                                                                                        </body>
                                                                                                    </body>
                                                                                                </body>
                                                                                            </body>
                                                                                        </body>
                                                                                    </body>
                                                                                </body>
                                                                            </body>
                                                                        </body>
                                                                    </body>
                                                                </body>
                                                            </body>
                                                        </body>
                                                    </body>
                                                </body>
                                            </body>
                                        </body>
                                    </body>
                                </body>
                            </body>
                        </body>
                    </body>
                </body>
            </body>
        </body>
        <site name="context_point" pos="0 0.05 0.1165" euler="-1.57 0 0" size="0.015" rgba="1 0 0 0.6" type="sphere"/>
        <site name="context_point1" pos="-0.5 -0.85 0.8165" euler="-1.57 0 0" size="0.015" rgba="0 1 0 0.3" type="sphere"/>
        <site name="context_point2" pos="-0.5 -0.85 1.4165" euler="-1.57 0 0" size="0.015" rgba="0 1 0 0.3" type="sphere"/>
        <site name="context_point3" pos="-0.5 -0.35 0.8165" euler="-1.57 0 0" size="0.015" rgba="0 1 0 0.3" type="sphere"/>
        <site name="context_point4" pos="-0.5 -0.35 1.4165" euler="-1.57 0 0" size="0.015" rgba="0 1 0 0.3" type="sphere"/>
        <site name="context_point5" pos="0.5 -0.85 0.8165" euler="-1.57 0 0" size="0.015" rgba="0 1 0 0.3" type="sphere"/>
        <site name="context_point6" pos="0.5 -0.85 1.4165" euler="-1.57 0 0" size="0.015" rgba="0 1 0 0.3" type="sphere"/>
        <site name="context_point7" pos="0.5 -0.35 0.8165" euler="-1.57 0 0" size="0.015" rgba="0 1 0 0.3" type="sphere"/>
        <site name="context_point8" pos="0.5 -0.35 1.4165" euler="-1.57 0 0" size="0.015" rgba="0 1 0 0.3" type="sphere"/>
        <site name="context_space" pos="0 -0.6 1.1165" euler="0 0 0" size="0.5 0.25 0.3" rgba="0 0 1 0.15" type="box"/>
        <camera name="visualization" mode="targetbody" target="wam/wrist_yaw_link" pos="1.5 -0.4 2.2"/>
        <camera name="experiment" mode="fixed" quat="0.44418059 0.41778323 0.54301123 0.57732103" pos="1.5 -0.3 1.33" />
    </worldbody>
    <actuator>
 <!--        <motor ctrllimited="true" ctrlrange="-150 150" joint="wam/base_yaw_joint"/>-->
 <!--        <motor ctrllimited="true" ctrlrange="-125 125" joint="wam/shoulder_pitch_joint"/>-->
 <!--        <motor ctrllimited="true" ctrlrange="-40 40" joint="wam/shoulder_yaw_joint"/>-->
 <!--        <motor ctrllimited="true" ctrlrange="-60 60" joint="wam/elbow_pitch_joint"/>-->
 <!--        <motor ctrllimited="true" ctrlrange="-5 5" joint="wam/wrist_yaw_joint"/>-->
 <!--        <motor ctrllimited="true" ctrlrange="-5 5" joint="wam/wrist_pitch_joint"/>-->
 <!--        <motor ctrllimited="true" ctrlrange="-2 2" joint="wam/palm_yaw_joint"/>-->
        <motor ctrllimited="true" ctrlrange="-1.0 1.0" gear="150.0" joint="wam/base_yaw_joint"/>
        <motor ctrllimited="true" ctrlrange="-1.0 1.0" gear="125.0" joint="wam/shoulder_pitch_joint"/>
        <motor ctrllimited="true" ctrlrange="-1.0 1.0" gear="40.0" joint="wam/shoulder_yaw_joint"/>
        <motor ctrllimited="true" ctrlrange="-1.0 1.0" gear="60.0" joint="wam/elbow_pitch_joint"/>
        <motor ctrllimited="true" ctrlrange="-1.0 1.0" gear="5.0" joint="wam/wrist_yaw_joint"/>
        <motor ctrllimited="true" ctrlrange="-1.0 1.0" gear="5.0" joint="wam/wrist_pitch_joint"/>
        <motor ctrllimited="true" ctrlrange="-1.0 1.0" gear="2.0" joint="wam/palm_yaw_joint"/>
    </actuator>
 </mujoco>
--- a/alr_envs/mujoco/ball_in_a_cup/ball_in_a_cup_reward.py
+++ b/alr_envs/mujoco/ball_in_a_cup/ball_in_a_cup_reward.py
@ -1,7 +1,8 @@
 import numpy as np
 from alr_envs.mujoco import alr_reward_fct
-class BallInACupReward:
+class BallInACupReward(alr_reward_fct.AlrReward):
    def __init__(self, sim_time):
        self.sim_time = sim_time
@ -14,7 +15,6 @@ class BallInACupReward:
                                  "forearm_link_convex_decomposition_p1_geom",
                                  "forearm_link_convex_decomposition_p2_geom"]
        self.ctxt_id = None
        self.ball_id = None
        self.ball_collision_id = None
        self.goal_id = None
@ -34,8 +34,7 @@ class BallInACupReward:
        self.dists_final = []
        self.costs = []
-    def compute_reward(self, action, sim, step):
+    def compute_reward(self, action, sim, step, context=None):
        self.ctxt_id = sim.model._site_name2id['context_point']
        self.ball_id = sim.model._body_name2id["ball"]
        self.ball_collision_id = sim.model._geom_name2id["ball_geom"]
        self.goal_id = sim.model._site_name2id["cup_goal"]
@ -50,59 +49,26 @@ class BallInACupReward:
        goal_final_pos = sim.data.site_xpos[self.goal_final_id]
        self.dists.append(np.linalg.norm(goal_pos - ball_pos))
        self.dists_final.append(np.linalg.norm(goal_final_pos - ball_pos))
        # dists_ctxt.append(np.linalg.norm(ball_pos - ctxt))
        self.ball_traj[step, :] = ball_pos
        if self.check_collision(sim):
            return -1000, False, True
        # self._get_cost(ball_pos, goal_pos, goal_final_pos, action,
        #                sim.data.get_site_xpos('context_point').copy(), step)
        # min_dist = np.min(self.dists)
        # dist_final = self.dists_final[-1]
        action_cost = np.sum(np.square(action))
        # cost = self.get_stage_wise_cost(ball_in_cup, min_dist, self.dists_final[-1])  # , self.dists_ctxt[-1])
        if step == self.sim_time - 1:
            min_dist = np.min(self.dists)
            dist_final = self.dists_final[-1]
            cost = 0.5 * min_dist + 0.5 * dist_final
-            # cost = 3 + 2 * (0.5 * min_dist ** 2 + 0.5 * dist_final ** 2)
+            reward = np.exp(-2 * cost) - 1e-5 * action_cost
-            reward = np.exp(-2 * min_dist) - 1e-5 * action_cost
+            success = dist_final < 0.05 and ball_in_cup
            success = dist_final < 0.05 and min_dist < 0.05
        else:
            cost = 0
            reward = - 1e-5 * action_cost
            success = False
        # action_cost = np.mean(np.sum(np.square(torques), axis=1), axis=0)
        return reward, success, False
    def get_stage_wise_cost(self, ball_in_cup, min_dist, dist_final):  #, dist_to_ctxt):
        # stop_sim = False
        cost = 3 + 2 * (0.5 * min_dist ** 2 + 0.5 * dist_final ** 2)
        # if not ball_in_cup:
        #     # cost = 3 + 2*(0.5 * min_dist + 0.5 * dist_final)
        #     cost = 3 + 2*(0.5 * min_dist**2 + 0.5 * dist_final**2)
        # else:
        #     # cost = 2*dist_to_ctxt
        #     cost = 2*dist_to_ctxt**2
        #     stop_sim = True
        #     # print(dist_to_ctxt-0.02)
        #     print('Context Distance:', dist_to_ctxt)
        return cost
    def _get_cost(self, ball_pos, goal_pos, goal_pos_final, u, ctxt, t):
        cost = 0
        if t == self.sim_time*0.8:
            dist = 0.5*np.linalg.norm(goal_pos-ball_pos)**2 + 0.5*np.linalg.norm(goal_pos_final-ball_pos)**2
            # dist_ctxt = np.linalg.norm(ctxt-goal_pos)**2
            cost = dist  # +dist_ctxt
        return cost
    def check_ball_in_cup(self, sim, ball_collision_id):
        cup_base_collision_id = sim.model._geom_name2id["cup_base_contact"]
        for coni in range(0, sim.data.ncon):
--- a/alr_envs/mujoco/ball_in_a_cup/ball_in_a_cup_simple.py
+++ b/alr_envs/mujoco/ball_in_a_cup/ball_in_a_cup_simple.py
@ -1,38 +1,41 @@
-from gym.envs.mujoco import mujoco_env
+from alr_envs.mujoco import alr_mujoco_env
 from gym import utils, spaces
 import os
 import numpy as np
 from alr_envs.mujoco.ball_in_a_cup.ball_in_a_cup_reward import BallInACupReward
 import mujoco_py
-class ALRBallInACupEnv(mujoco_env.MujocoEnv, utils.EzPickle):
+class ALRBallInACupEnv(alr_mujoco_env.AlrMujocoEnv, utils.EzPickle):
-    def __init__(self, pd_control=True):
+    def __init__(self, reward_function=None):
        self._steps = 0
        self.pd_control = pd_control
        self.xml_path = os.path.join(os.path.dirname(os.path.abspath(__file__)), "assets",
-                                     "ball-in-a-cup_base" + ".xml")
+                                     "biac_base" + ".xml")
        self.sim_time = 8  # seconds
        self.sim_steps = int(self.sim_time / (0.0005 * 4))  # circular dependency.. sim.dt <-> mujocoenv init <-> reward fct
-        self.reward_function = BallInACupReward(self.sim_steps)
+        self.reward_function = reward_function(self.sim_steps)
        self.start_pos = np.array([0.0, 0.58760536, 0.0, 1.36004913, 0.0, -0.32072943, -1.57])
        self.start_vel = np.zeros(7)
-        # self.start_pos = np.array([0.58760536, 1.36004913, -0.32072943])
+
        self._q_pos = []
        self._q_vel = []
        # self.weight_matrix_scale = 50
-        self.p_gains = 1*np.array([200, 300, 100, 100, 10, 10, 2.5])
+        self.max_ctrl = np.array([150., 125., 40., 60., 5., 5., 2.])
-        self.d_gains = 1*np.array([7, 15, 5, 2.5, 0.3, 0.3, 0.05])
+        self.p_gains = 1 / self.max_ctrl * np.array([200, 300, 100, 100, 10, 10, 2.5])
        self.d_gains = 1 / self.max_ctrl * np.array([7, 15, 5, 2.5, 0.3, 0.3, 0.05])
        self.j_min = np.array([-2.6, -1.985, -2.8, -0.9, -4.55, -1.5707, -2.7])
        self.j_max = np.array([2.6, 1.985, 2.8, 3.14159, 1.25, 1.5707, 2.7])
        self.context = None
        utils.EzPickle.__init__(self)
-        mujoco_env.MujocoEnv.__init__(self, os.path.join(os.path.dirname(__file__), "assets", "ball-in-a-cup_base.xml"),
+        alr_mujoco_env.AlrMujocoEnv.__init__(self,
-                                      frame_skip=4)
+                                             self.xml_path,
                                             apply_gravity_comp=True,
                                             n_substeps=4)
    @property
    def current_pos(self):
@ -42,96 +45,68 @@ class ALRBallInACupEnv(mujoco_env.MujocoEnv, utils.EzPickle):
    def current_vel(self):
        return self.sim.data.qvel[0:7].copy()
    def configure(self, context):
        self.context = context
    def reset_model(self):
        init_pos_all = self.init_qpos.copy()
        init_pos_robot = self.start_pos
        init_vel = np.zeros_like(init_pos_all)
        ball_id = self.sim.model._body_name2id["ball"]
        goal_final_id = self.sim.model._site_name2id["cup_goal_final"]
-        # self.set_state(start_pos, start_vel)
+
        self._steps = 0
        self.reward_function.reset()
        self._q_pos = []
        self._q_vel = []
        start_pos = init_pos_all
        start_pos[0:7] = init_pos_robot
        self.set_state(start_pos, init_vel)
        # Reset the system
-        self.sim.data.qpos[:] = init_pos_all
+        # self.sim.data.qpos[:] = init_pos_all
-        self.sim.data.qvel[:] = init_vel
+        # self.sim.data.qvel[:] = init_vel
-        self.sim.data.qpos[0:7] = init_pos_robot
+        # self.sim.data.qpos[0:7] = init_pos_robot
        #
        # self.sim.step()
        #
        # self.sim.data.qpos[:] = init_pos_all
        # self.sim.data.qvel[:] = init_vel
        # self.sim.data.qpos[0:7] = init_pos_robot
        # self.sim.data.body_xpos[ball_id, :] = np.copy(self.sim.data.site_xpos[goal_final_id, :]) - np.array([0., 0., 0.329])
        #
        # # Stabilize the system around the initial position
        # for i in range(0, 500):
        #     self.sim.data.qpos[7:] = 0.
        #     self.sim.data.qvel[7:] = 0.
        #     # self.sim.data.qpos[7] = -0.2
        #     cur_pos = self.sim.data.qpos[0:7].copy()
        #     cur_vel = self.sim.data.qvel[0:7].copy()
        #     trq = self.p_gains * (init_pos_robot - cur_pos) + self.d_gains * (np.zeros_like(init_pos_robot) - cur_vel)
        #     self.sim.data.qfrc_applied[0:7] = trq + self.sim.data.qfrc_bias[:7].copy()
        #     self.sim.step()
        #     self.render()
        #
        # for i in range(0, 500):
        #     cur_pos = self.sim.data.qpos[0:7].copy()
        #     cur_vel = self.sim.data.qvel[0:7].copy()
        #     trq = self.p_gains * (init_pos_robot - cur_pos) + self.d_gains * (np.zeros_like(init_pos_robot) - cur_vel)
        #     self.sim.data.qfrc_applied[0:7] = trq + self.sim.data.qfrc_bias[:7].copy()
        #     self.sim.step()
        #     self.render()
-        self.sim.step()
+        return self._get_obs()
        self.sim.data.qpos[:] = init_pos_all
        self.sim.data.qvel[:] = init_vel
        self.sim.data.qpos[0:7] = init_pos_robot
        self.sim.data.body_xpos[ball_id, :] = np.copy(self.sim.data.site_xpos[goal_final_id, :]) - np.array([0., 0., 0.329])
        # Stabilize the system around the initial position
        for i in range(0, 2000):
            self.sim.data.qpos[7:] = 0.
            self.sim.data.qvel[7:] = 0.
            # self.sim.data.qpos[7] = -0.2
            cur_pos = self.sim.data.qpos[0:7].copy()
            cur_vel = self.sim.data.qvel[0:7].copy()
            trq = self.p_gains * (init_pos_robot - cur_pos) + self.d_gains * (np.zeros_like(init_pos_robot) - cur_vel)
            self.sim.data.qfrc_applied[0:7] = trq + self.sim.data.qfrc_bias[:7].copy()
            self.sim.step()
            # self.render()
        for i in range(0, 2000):
            cur_pos = self.sim.data.qpos[0:7].copy()
            cur_vel = self.sim.data.qvel[0:7].copy()
            trq = self.p_gains * (init_pos_robot - cur_pos) + self.d_gains * (np.zeros_like(init_pos_robot) - cur_vel)
            self.sim.data.qfrc_applied[0:7] = trq + self.sim.data.qfrc_bias[:7].copy()
            self.sim.step()
            # self.render()
    def do_simulation(self, ctrl, n_frames):
        # cur_pos = self.sim.data.qpos[0:7].copy()
        # cur_vel = self.sim.data.qvel[0:7].copy()
        # des_pos = ctrl[:7]
        # des_vel = ctrl[7:]
        # trq = self.p_gains * (des_pos - cur_pos) + self.d_gains * (des_vel - cur_vel)
        if self.pd_control:
            self.sim.data.qfrc_applied[0:7] = ctrl + self.sim.data.qfrc_bias[:7].copy()
        else:
            self.sim.data.ctrl[:] = ctrl
        for _ in range(n_frames):
            try:
                self.sim.step()
            except mujoco_py.builder.MujocoException as e:
                print("Error in simulation: " + str(e))
                # error = True
                # Copy the current torque as if it would have been applied until the end of the trajectory
                # for i in range(k + 1, sim_time):
                #     torques.append(trq)
                return True
        return False
    def step(self, a):
        # Apply gravity compensation
        # if not np.all(self.sim.data.qfrc_applied[:7] == self.sim.data.qfrc_bias[:7]):
        #     self.sim.data.qfrc_applied[:7] = self.sim.data.qfrc_bias[:7]
        reward_dist = 0.0
        angular_vel = 0.0
        # if self._steps >= self.steps_before_reward:
        #     vec = self.get_body_com("fingertip") - self.get_body_com("target")
        #     reward_dist -= self.reward_weight * np.linalg.norm(vec)
        #     angular_vel -= np.linalg.norm(self.sim.data.qvel.flat[:self.n_links])
        reward_ctrl = - np.square(a).sum()
        # reward_balance = - self.balance_weight * np.abs(
        #     angle_normalize(np.sum(self.sim.data.qpos.flat[:self.n_links]), type="rad"))
        #
        # reward = reward_dist + reward_ctrl + angular_vel + reward_balance
        # self.do_simulation(a, self.frame_skip)
        crash = self.do_simulation(a)
        joint_cons_viol = self.check_traj_in_joint_limits()
        crash = self.do_simulation(a, self.frame_skip)
        self._q_pos.append(self.sim.data.qpos[0:7].ravel().copy())
        self._q_vel.append(self.sim.data.qvel[0:7].ravel().copy())
@ -153,17 +128,7 @@ class ALRBallInACupEnv(mujoco_env.MujocoEnv, utils.EzPickle):
    def check_traj_in_joint_limits(self):
        return any(self.current_pos > self.j_max) or any(self.current_pos < self.j_min)
-    def check_collision(self):
+    # TODO: extend observation space
        for coni in range(0, sim.data.ncon):
            con = sim.data.contact[coni]
            collision = con.geom1 in self.collision_ids and con.geom2 == self.ball_collision_id
            collision_trans = con.geom1 == self.ball_collision_id and con.geom2 in self.collision_ids
            if collision or collision_trans:
                return True
        return False
    def _get_obs(self):
        theta = self.sim.data.qpos.flat[:7]
        return np.concatenate([
@ -187,8 +152,9 @@ class ALRBallInACupEnv(mujoco_env.MujocoEnv, utils.EzPickle):
        des_vel_full[5] = des_vel[2]
        return des_vel_full
 if __name__ == "__main__":
-    env = ALRBallInACupEnv()
+    env = ALRBallInACupEnv(reward_function=BallInACupReward)
    env.reset()
    env.render()
    for i in range(4000):
@ -196,7 +162,8 @@ if __name__ == "__main__":
        # test with random actions
        # ac = 0.1 * env.action_space.sample()
        # ac = -np.array([i, i, i]) / 10000 + np.array([env.start_pos[1], env.start_pos[3], env.start_pos[5]])
-        ac = np.array([0., -0.1, 0, 0, 0, 0, 0])
+        # ac = np.array([0., -10, 0, -1, 0, 1, 0])
        ac = np.array([0.,0., 0, 0, 0, 0, 0])
        # ac[0] += np.pi/2
        obs, rew, d, info = env.step(ac)
        env.render()
--- a/alr_envs/utils/dmp_async_vec_env.py
+++ b/alr_envs/utils/dmp_async_vec_env.py
@ -24,14 +24,14 @@ class DmpAsyncVectorEnv(gym.vector.AsyncVectorEnv):
                                               n=n_samples,
                                               fn=np.zeros)
-    def __call__(self, params):
+    def __call__(self, params, contexts=None):
-        return self.rollout(params)
+        return self.rollout(params, contexts)
-    def rollout_async(self, actions):
+    def rollout_async(self, params, contexts):
        """
        Parameters
        ----------
-        actions : iterable of samples from `action_space`
+        params : iterable of samples from `action_space`
            List of actions.
        """
        self._assert_is_running()
@ -40,11 +40,17 @@ class DmpAsyncVectorEnv(gym.vector.AsyncVectorEnv):
                                          'for a pending call to `{0}` to complete.'.format(
                self._state.value), self._state.value)
-        actions = np.atleast_2d(actions)
+        params = np.atleast_2d(params)
-        split_actions = np.array_split(actions, np.minimum(len(actions), self.num_envs))
+        split_params = np.array_split(params, np.minimum(len(params), self.num_envs))
-        for pipe, action in zip(self.parent_pipes, split_actions):
+        if contexts is None:
-            pipe.send(('rollout', action))
+            split_contexts = np.array_split([None, ] * len(params), np.minimum(len(params), self.num_envs))
-        for pipe in self.parent_pipes[len(split_actions):]:
+        else:
            split_contexts = np.array_split(contexts, np.minimum(len(contexts), self.num_envs))
        assert np.all([len(p) == len(c) for p, c in zip(split_params, split_contexts)])
        for pipe, param, context in zip(self.parent_pipes, split_params, split_contexts):
            pipe.send(('rollout', (param, context)))
        for pipe in self.parent_pipes[len(split_params):]:
            pipe.send(('idle', None))
        self._state = AsyncState.WAITING_ROLLOUT
@ -98,8 +104,8 @@ class DmpAsyncVectorEnv(gym.vector.AsyncVectorEnv):
        return np.array(rewards), infos
-    def rollout(self, actions):
+    def rollout(self, actions, contexts):
-        self.rollout_async(actions)
+        self.rollout_async(actions, contexts)
        return self.rollout_wait()
@ -123,8 +129,8 @@ def _worker(index, env_fn, pipe, parent_pipe, shared_memory, error_queue):
                rewards = []
                dones = []
                infos = []
-                for d in data:
+                for p, c in zip(*data):
-                    observation, reward, done, info = env.rollout(d)
+                    observation, reward, done, info = env.rollout(p, c)
                    observations.append(observation)
                    rewards.append(reward)
                    dones.append(done)
--- a/alr_envs/utils/dmp_env_wrapper.py
+++ b/alr_envs/utils/dmp_env_wrapper.py
@ -5,7 +5,19 @@ import numpy as np
 import gym
-class DmpEnvWrapperBase(gym.Wrapper):
+def get_policy_class(policy_type):
    if policy_type == "motor":
        from alr_envs.utils.policies import PDController
        return PDController
    elif policy_type == "velocity":
        from alr_envs.utils.policies import VelController
        return VelController
    elif policy_type == "position":
        from alr_envs.utils.policies import PosController
        return PosController
 class DmpEnvWrapper(gym.Wrapper):
    def __init__(self,
                 env,
                 num_dof,
@ -17,8 +29,9 @@ class DmpEnvWrapperBase(gym.Wrapper):
                 dt=0.01,
                 learn_goal=False,
                 post_traj_time=0.,
-                 policy=None):
+                 policy_type=None,
-        super(DmpEnvWrapperBase, self).__init__(env)
+                 weights_scale=1.):
        super(DmpEnvWrapper, self).__init__(env)
        self.num_dof = num_dof
        self.num_basis = num_basis
        self.dim = num_dof * num_basis
@ -49,17 +62,19 @@ class DmpEnvWrapperBase(gym.Wrapper):
            dmp_goal_pos = final_pos
        self.dmp.set_weights(dmp_weights, dmp_goal_pos)
        self.weights_scale = weights_scale
-        self.policy = policy
+        policy_class = get_policy_class(policy_type)
        self.policy = policy_class(env)
-    def __call__(self, params):
+    def __call__(self, params, contexts=None):
        params = np.atleast_2d(params)
        observations = []
        rewards = []
        dones = []
        infos = []
-        for p in params:
+        for p, c in zip(params, contexts):
-            observation, reward, done, info = self.rollout(p)
+            observation, reward, done, info = self.rollout(p, c)
            observations.append(observation)
            rewards.append(reward)
            dones.append(done)
@ -81,82 +96,11 @@ class DmpEnvWrapperBase(gym.Wrapper):
            goal_pos = None
            weight_matrix = np.reshape(params, [self.num_basis, self.num_dof])
-        return goal_pos, weight_matrix
+        return goal_pos, weight_matrix * self.weights_scale
-    def rollout(self, params, render=False):
+    def rollout(self, params, context=None, render=False):
        """ This function generates a trajectory based on a DMP and then does the usual loop over reset and step"""
-        raise NotImplementedError
+        goal_pos, weight_matrix = self.goal_and_weights(params)
 class DmpEnvWrapperPos(DmpEnvWrapperBase):
    """
    Wrapper for gym environments which creates a trajectory in joint angle space
    """
    def rollout(self, action, render=False):
        goal_pos, weight_matrix = self.goal_and_weights(action)
        if hasattr(self.env, "weight_matrix_scale"):
            weight_matrix = weight_matrix * self.env.weight_matrix_scale
        self.dmp.set_weights(weight_matrix, goal_pos)
        trajectory, _ = self.dmp.reference_trajectory(self.t)
        if self.post_traj_steps > 0:
            trajectory = np.vstack([trajectory, np.tile(trajectory[-1, :], [self.post_traj_steps, 1])])
        self._trajectory = trajectory
        rews = []
        self.env.reset()
        for t, traj in enumerate(trajectory):
            obs, rew, done, info = self.env.step(traj)
            rews.append(rew)
            if render:
                self.env.render(mode="human")
            if done:
                break
        reward = np.sum(rews)
        return obs, reward, done, info
 class DmpEnvWrapperVel(DmpEnvWrapperBase):
    """
    Wrapper for gym environments which creates a trajectory in joint velocity space
    """
    def rollout(self, action, render=False):
        goal_pos, weight_matrix = self.goal_and_weights(action)
        if hasattr(self.env, "weight_matrix_scale"):
            weight_matrix = weight_matrix * self.env.weight_matrix_scale
        self.dmp.set_weights(weight_matrix, goal_pos)
        _, velocities = self.dmp.reference_trajectory(self.t)
        rews = []
        infos = []
        self.env.reset()
        for t, vel in enumerate(velocities):
            obs, rew, done, info = self.env.step(vel)
            rews.append(rew)
            infos.append(info)
            if render:
                self.env.render(mode="human")
            if done:
                break
        reward = np.sum(rews)
        return obs, reward, done, info
 class DmpEnvWrapperPD(DmpEnvWrapperBase):
    """
    Wrapper for gym environments which creates a trajectory in joint velocity space
    """
    def rollout(self, action, render=False):
        goal_pos, weight_matrix = self.goal_and_weights(action)
        if hasattr(self.env, "weight_matrix_scale"):
            weight_matrix = weight_matrix * self.env.weight_matrix_scale
        self.dmp.set_weights(weight_matrix, goal_pos)
@ -173,9 +117,11 @@ class DmpEnvWrapperPD(DmpEnvWrapperBase):
        infos = []
        self.env.reset()
        if context is not None:
            self.env.configure(context)
        for t, pos_vel in enumerate(zip(trajectory, velocity)):
-            ac = self.policy.get_action(self.env, pos_vel[0], pos_vel[1])
+            ac = self.policy.get_action(pos_vel[0], pos_vel[1])
            obs, rew, done, info = self.env.step(ac)
            rews.append(rew)
            infos.append(info)
--- a/alr_envs/utils/policies.py
+++ b/alr_envs/utils/policies.py
@ -1,15 +1,37 @@
-class PDController:
+from alr_envs.mujoco.alr_mujoco_env import AlrMujocoEnv
    def __init__(self, p_gains, d_gains):
        self.p_gains = p_gains
        self.d_gains = d_gains
-    def get_action(self, env, des_pos, des_vel):
+
 class BaseController:
    def __init__(self, env: AlrMujocoEnv):
        self.env = env
    def get_action(self, des_pos, des_vel):
        raise NotImplementedError
 class PosController(BaseController):
    def get_action(self, des_pos, des_vel):
        return des_pos
 class VelController(BaseController):
    def get_action(self, des_pos, des_vel):
        return des_vel
 class PDController(BaseController):
    def __init__(self, env):
        self.p_gains = env.p_gains
        self.d_gains = env.d_gains
        super(PDController, self).__init__(env)
    def get_action(self, des_pos, des_vel):
        # TODO: make standardized ALRenv such that all of them have current_pos/vel attributes
-        cur_pos = env.current_pos
+        cur_pos = self.env.current_pos
-        cur_vel = env.current_vel
+        cur_vel = self.env.current_vel
        if len(des_pos) != len(cur_pos):
-            des_pos = env.extend_des_pos(des_pos)
+            des_pos = self.env.extend_des_pos(des_pos)
        if len(des_vel) != len(cur_vel):
-            des_vel = env.extend_des_vel(des_vel)
+            des_vel = self.env.extend_des_vel(des_vel)
        trq = self.p_gains * (des_pos - cur_pos) + self.d_gains * (des_vel - cur_vel)
        return trq
--- a/dmp_pd_control_example.py
+++ b/dmp_pd_control_example.py
@ -1,7 +1,7 @@
-from alr_envs.utils.dmp_env_wrapper import DmpEnvWrapperPD
+from alr_envs.utils.dmp_env_wrapper import DmpEnvWrapper
 from alr_envs.utils.policies import PDController
 from alr_envs.utils.dmp_async_vec_env import DmpAsyncVectorEnv, _worker
-from alr_envs.mujoco.reacher.alr_reacher import ALRReacherEnv
+from alr_envs.mujoco.ball_in_a_cup.ball_in_a_cup_simple import ALRBallInACupEnv
 from alr_envs.mujoco.ball_in_a_cup.ball_in_a_cup_reward import BallInACupReward
 import numpy as np
@ -17,32 +17,42 @@ if __name__ == "__main__":
        :param rank: (int) index of the subprocess
        """
        def _init():
-            p_gains = np.array([100, 100, 100, 100, 100])
+            _env = ALRBallInACupEnv(BallInACupReward)
            d_gains = np.array([1, 1, 1, 1, 1])
            policy = PDController(p_gains, d_gains)
-            env = ALRReacherEnv()
+            _env = DmpEnvWrapper(_env,
-
+                                 num_dof=3,
-            env = DmpEnvWrapperPD(env,
+                                 num_basis=8,
-                                  num_dof=5,
+                                 duration=3.5,
-                                  num_basis=5,
+                                 alpha_phase=3,
-                                  duration=4,
+                                 dt=_env.dt,
-                                  dt=env.dt,
+                                 learn_goal=False,
-                                  learn_goal=False,
+                                 start_pos=_env.start_pos[1::2],
-                                  start_pos=env.init_qpos[:5],
+                                 final_pos=_env.start_pos[1::2],
-                                  final_pos=env.init_qpos[:5],
+                                 policy_type="motor"
-                                  alpha_phase=2,
+                                 # contextual=True
-                                  policy=policy
+                                 )
-                                  )
+            _env.seed(seed + rank)
-            env.seed(seed + rank)
+            return _env
            return env
        return _init
-    dim = 25
+    dim = 24
-    env = make_env(0, 0)()
+
    n_samples = 10
    vec_env = DmpAsyncVectorEnv([make_env(i) for i in range(4)],
                                n_samples=n_samples,
                                context="spawn",
                                shared_memory=False,
                                worker=_worker)
    params = 10 * np.random.randn(n_samples, dim)
    out = vec_env(params)
    non_vec_env = make_env(0, 0)()
    params = 10 * np.random.randn(dim)
-    out = env.rollout(params, render=True)
+    out2 = non_vec_env.rollout(params, render=True)
-    print(out)
+    print(out2)