# fancy_gym/alr_envs/envs/mujoco/beerpong/mp_wrapper.py

from typing import Union, Tuple

import numpy as np

from alr_envs.black_box.raw_interface_wrapper import RawInterfaceWrapper


class MPWrapper(RawInterfaceWrapper):
    """Raw-interface wrapper for the beer pong environment (per the file path).

    Provides the context mask over the observation vector, the current
    position/velocity of the first seven generalized coordinates, a
    per-episode callback and a setter for the context (cup xy position).
    """

    @property
    def context_mask(self) -> np.ndarray:
        """Return a boolean mask marking the context entries of the observation.

        Only the last two entries (xy position of the cup) are flagged True.
        """
        # (segment length, is-context) in observation order; labels follow
        # the layout documented in the original mask.
        layout = (
            (7, False),  # cos
            (7, False),  # sin
            (7, False),  # joint velocities
            (3, False),  # cup_goal_diff_final
            (3, False),  # cup_goal_diff_top
            (2, True),   # xy position of cup
            # (1, False),  # env steps -- deliberately not part of the mask
        )
        return np.concatenate([np.full(length, flag) for length, flag in layout])

    @property
    def current_pos(self) -> Union[float, int, np.ndarray, Tuple]:
        """Return a copy of the first seven entries of ``self.data.qpos``."""
        joint_qpos = self.data.qpos[:7]
        return joint_qpos.copy()

    @property
    def current_vel(self) -> Union[float, int, np.ndarray, Tuple]:
        """Return a copy of the first seven entries of ``self.data.qvel``."""
        joint_qvel = self.data.qvel[:7]
        return joint_qvel.copy()

    # TODO: Fix this (carried over from the original; the intended fix is
    # not stated anywhere in this file).
    def _episode_callback(self, action: np.ndarray, mp) -> Tuple[np.ndarray, Union[np.ndarray, None]]:
        """Record the release step when tau is learned; pass the action through.

        Args:
            action: Parameter vector for the episode. When ``mp.learn_tau`` is
                truthy, ``action[0]`` is read as the tau value.
            mp: Object exposing a ``learn_tau`` attribute.

        Returns:
            The unmodified ``action`` and ``None``.
        """
        if mp.learn_tau:
            # Tau value divided by dt -- presumably a duration converted to a
            # number of steps; confirm against the environment.
            self.release_step = action[0] / self.dt
        return action, None

    def set_context(self, context):
        """Move the cup table body to the given xy context and return the observation.

        Args:
            context: Values assigned to the x and y components of the body
                position.

        Returns:
            ``self.get_observation_from_step`` applied to ``self.get_obs()``
            after the body position has been updated.
        """
        # z is fixed at 0.840 (presumably the table height -- TODO confirm).
        cup_pos = np.array([0.0, 0.0, 0.840])
        cup_pos[:2] = context
        self.model.body_pos[self.cup_table_id] = cup_pos
        raw_obs = self.get_obs()
        return self.get_observation_from_step(raw_obs)
mp wrapper beer pong 2022-07-06 09:18:41 +02:00			`from typing import Union, Tuple`

			`import numpy as np`

			`from alr_envs.black_box.raw_interface_wrapper import RawInterfaceWrapper`


			`class MPWrapper(RawInterfaceWrapper):`

bugfixes 2022-07-07 10:47:04 +02:00			`@property`
			`def context_mask(self) -> np.ndarray:`
mp wrapper beer pong 2022-07-06 09:18:41 +02:00			`return np.hstack([`
			`[False] * 7, # cos`
			`[False] * 7, # sin`
			`[False] * 7, # joint velocities`
			`[False] * 3, # cup_goal_diff_final`
			`[False] * 3, # cup_goal_diff_top`
			`[True] * 2, # xy position of cup`
bugfixes 2022-07-07 10:47:04 +02:00			`# [False] # env steps`
mp wrapper beer pong 2022-07-06 09:18:41 +02:00			`])`

			`@property`
			`def current_pos(self) -> Union[float, int, np.ndarray, Tuple]:`
removed dependency on mujoco-py 2022-07-13 13:28:39 +02:00			`return self.data.qpos[0:7].copy()`
mp wrapper beer pong 2022-07-06 09:18:41 +02:00
			`@property`
			`def current_vel(self) -> Union[float, int, np.ndarray, Tuple]:`
removed dependency on mujoco-py 2022-07-13 13:28:39 +02:00			`return self.data.qvel[0:7].copy()`
mp wrapper beer pong 2022-07-06 09:18:41 +02:00
			`# TODO: Fix this`
			`def _episode_callback(self, action: np.ndarray, mp) -> Tuple[np.ndarray, Union[np.ndarray, None]]:`
			`if mp.learn_tau:`
removed dependency on mujoco-py 2022-07-13 13:28:39 +02:00			`self.release_step = action[0] / self.dt # Tau value`
mp wrapper beer pong 2022-07-06 09:18:41 +02:00			`return action, None`
			`else:`
			`return action, None`

			`def set_context(self, context):`
			`xyz = np.zeros(3)`
			`xyz[:2] = context`
			`xyz[-1] = 0.840`
removed dependency on mujoco-py 2022-07-13 13:28:39 +02:00			`self.model.body_pos[self.cup_table_id] = xyz`
			`return self.get_observation_from_step(self.get_obs())`