2021-11-05 11:04:04 +01:00
|
|
|
from typing import Tuple, Union
|
|
|
|
|
|
|
|
import numpy as np
|
|
|
|
|
2022-06-30 17:33:05 +02:00
|
|
|
from alr_envs.black_box.raw_interface_wrapper import RawInterfaceWrapper
|
2021-11-05 11:04:04 +01:00
|
|
|
|
|
|
|
|
2022-06-30 14:08:54 +02:00
|
|
|
class MPWrapper(RawInterfaceWrapper):
    """Raw-interface wrapper exposing joint state and timing of the wrapped env.

    Every member is a read-only property. Positions and velocities are read
    from the first seven entries of the simulator state, which the inline
    comments in ``context_mask`` label as the joint positions.
    """

    @property
    def context_mask(self) -> np.ndarray:
        """Return the boolean mask over the 11 observation entries.

        The mask is ``False`` for the first 7 entries and ``True`` for the
        remaining 4. Presumably ``True`` marks entries that are part of the
        context -- confirm against ``RawInterfaceWrapper``.
        """
        # TODO: @Max Filter observations correctly
        return np.hstack([
            [False] * 7,  # Joint Pos
            [True] * 2,  # Ball pos
            [True] * 2,  # goal pos
        ])

    @property
    def start_pos(self) -> Union[float, int, np.ndarray, Tuple]:
        """Return ``init_qpos_tt`` as stored on the wrapped environment.

        NOTE(review): presumably the initial joint configuration; whether its
        length matches the 7 joints used by ``current_pos`` is not visible
        here -- confirm against the environment definition.
        """
        # Was ``self.self.init_qpos_tt``: the doubled ``self`` is a typo, so
        # the attribute is read from the wrapped env like ``dt`` below.
        return self.env.init_qpos_tt

    @property
    def current_pos(self) -> Union[float, int, np.ndarray, Tuple]:
        """Return a copy of the first 7 entries of ``sim.data.qpos``."""
        # Copy so callers cannot mutate the simulator state through the slice.
        return self.sim.data.qpos[:7].copy()

    @property
    def current_vel(self) -> Union[float, int, np.ndarray, Tuple]:
        """Return a copy of the first 7 entries of ``sim.data.qvel``."""
        # Copy so callers cannot mutate the simulator state through the slice.
        return self.sim.data.qvel[:7].copy()

    @property
    def goal_pos(self):
        """Always raise, because this wrapper defines no fixed goal position.

        Raises:
            ValueError: On every access.
        """
        # TODO: @Max I think the default value of returning to the start is reasonable here
        raise ValueError("Goal position is not available and has to be learnt based on the environment.")

    @property
    def dt(self) -> Union[float, int]:
        """Return the ``dt`` attribute of the wrapped environment."""
        return self.env.dt
|