Merge remote-tracking branch 'origin/master' into Add-ProDMP-envs
# Conflicts: # fancy_gym/black_box/black_box_wrapper.py # fancy_gym/meta/__init__.py
This commit is contained in:
commit
176fb087af
@ -46,7 +46,7 @@ pip install -e .
|
||||
In case you want to use dm_control oder metaworld, you can install them by specifying extras
|
||||
|
||||
```bash
|
||||
pip install -e .[dmc, metaworld]
|
||||
pip install -e .[dmc,metaworld]
|
||||
```
|
||||
|
||||
> **Note:**
|
||||
@ -205,7 +205,7 @@ at the [examples](fancy_gym/examples/).
|
||||
import fancy_gym
|
||||
|
||||
# Base environment name, according to structure of above example
|
||||
base_env_id = "ball_in_cup-catch"
|
||||
base_env_id = "dmc:ball_in_cup-catch"
|
||||
|
||||
# Replace this wrapper with the custom wrapper for your environment by inheriting from the RawInferfaceWrapper.
|
||||
# You can also add other gym.Wrappers in case they are needed,
|
||||
|
@ -21,7 +21,9 @@ class BlackBoxWrapper(gym.ObservationWrapper):
|
||||
learn_sub_trajectories: bool = False,
|
||||
replanning_schedule: Optional[
|
||||
Callable[[np.ndarray, np.ndarray, np.ndarray, np.ndarray, int], bool]] = None,
|
||||
reward_aggregation: Callable[[np.ndarray], float] = np.sum
|
||||
reward_aggregation: Callable[[np.ndarray], float] = np.sum,
|
||||
max_planning_times: int = np.inf,
|
||||
condition_on_desired: bool = False
|
||||
):
|
||||
"""
|
||||
gym.Wrapper for leveraging a black box approach with a trajectory generator.
|
||||
@ -66,6 +68,14 @@ class BlackBoxWrapper(gym.ObservationWrapper):
|
||||
self.render_kwargs = {}
|
||||
self.verbose = verbose
|
||||
|
||||
# condition value
|
||||
self.condition_on_desired = condition_on_desired
|
||||
self.condition_pos = None
|
||||
self.condition_vel = None
|
||||
|
||||
self.max_planning_times = max_planning_times
|
||||
self.plan_steps = 0
|
||||
|
||||
def observation(self, observation):
|
||||
# return context space if we are
|
||||
if self.return_context_observation:
|
||||
@ -83,10 +93,12 @@ class BlackBoxWrapper(gym.ObservationWrapper):
|
||||
|
||||
clipped_params = np.clip(action, self.traj_gen_action_space.low, self.traj_gen_action_space.high)
|
||||
self.traj_gen.set_params(clipped_params)
|
||||
bc_time = np.array(0 if not self.do_replanning else self.current_traj_steps * self.dt)
|
||||
# TODO we could think about initializing with the previous desired value in order to have a smooth transition
|
||||
# at least from the planning point of view.
|
||||
self.traj_gen.set_initial_conditions(bc_time, self.current_pos, self.current_vel)
|
||||
init_time = np.array(0 if not self.do_replanning else self.current_traj_steps * self.dt)
|
||||
|
||||
condition_pos = self.condition_pos if self.condition_pos is not None else self.current_pos
|
||||
condition_vel = self.condition_vel if self.condition_vel is not None else self.current_vel
|
||||
|
||||
self.traj_gen.set_initial_conditions(init_time, condition_pos, condition_vel)
|
||||
self.traj_gen.set_duration(duration, self.dt)
|
||||
# traj_dict = self.traj_gen.get_trajs(get_pos=True, get_vel=True)
|
||||
position = get_numpy(self.traj_gen.get_traj_pos())
|
||||
@ -144,6 +156,7 @@ class BlackBoxWrapper(gym.ObservationWrapper):
|
||||
infos = dict()
|
||||
done = False
|
||||
|
||||
self.plan_steps += 1
|
||||
for t, (pos, vel) in enumerate(zip(position, velocity)):
|
||||
step_action = self.tracking_controller.get_action(pos, vel, self.current_pos, self.current_vel)
|
||||
c_action = np.clip(step_action, self.env.action_space.low, self.env.action_space.high)
|
||||
@ -162,8 +175,13 @@ class BlackBoxWrapper(gym.ObservationWrapper):
|
||||
if self.render_kwargs:
|
||||
self.env.render(**self.render_kwargs)
|
||||
|
||||
if done or self.replanning_schedule(self.current_pos, self.current_vel, obs, c_action,
|
||||
t + 1 + self.current_traj_steps):
|
||||
if done or (self.replanning_schedule(self.current_pos, self.current_vel, obs, c_action,
|
||||
t + 1 + self.current_traj_steps)
|
||||
and self.plan_steps < self.max_planning_times):
|
||||
|
||||
self.condition_pos = pos if self.condition_on_desired else None
|
||||
self.condition_vel = vel if self.condition_on_desired else None
|
||||
|
||||
break
|
||||
|
||||
infos.update({k: v[:t + 1] for k, v in infos.items()})
|
||||
@ -187,5 +205,8 @@ class BlackBoxWrapper(gym.ObservationWrapper):
|
||||
|
||||
def reset(self, *, seed: Optional[int] = None, return_info: bool = False, options: Optional[dict] = None):
|
||||
self.current_traj_steps = 0
|
||||
self.plan_steps = 0
|
||||
self.traj_gen.reset()
|
||||
self.condition_vel = None
|
||||
self.condition_pos = None
|
||||
return super(BlackBoxWrapper, self).reset()
|
||||
|
@ -16,6 +16,8 @@ from .mujoco.hopper_throw.hopper_throw import MAX_EPISODE_STEPS_HOPPERTHROW
|
||||
from .mujoco.hopper_throw.hopper_throw_in_basket import MAX_EPISODE_STEPS_HOPPERTHROWINBASKET
|
||||
from .mujoco.reacher.reacher import ReacherEnv, MAX_EPISODE_STEPS_REACHER
|
||||
from .mujoco.walker_2d_jump.walker_2d_jump import MAX_EPISODE_STEPS_WALKERJUMP
|
||||
from .mujoco.box_pushing.box_pushing_env import BoxPushingDense, BoxPushingTemporalSparse, \
|
||||
BoxPushingTemporalSpatialSparse, MAX_EPISODE_STEPS_BOX_PUSHING
|
||||
|
||||
ALL_FANCY_MOVEMENT_PRIMITIVE_ENVIRONMENTS = {"DMP": [], "ProMP": [], "ProDMP": []}
|
||||
|
||||
@ -36,7 +38,8 @@ DEFAULT_BB_DICT_ProMP = {
|
||||
"basis_generator_kwargs": {
|
||||
'basis_generator_type': 'zero_rbf',
|
||||
'num_basis': 5,
|
||||
'num_basis_zero_start': 1
|
||||
'num_basis_zero_start': 1,
|
||||
'basis_bandwidth_factor': 3.0,
|
||||
}
|
||||
}
|
||||
|
||||
@ -60,6 +63,29 @@ DEFAULT_BB_DICT_DMP = {
|
||||
}
|
||||
}
|
||||
|
||||
DEFAULT_BB_DICT_ProDMP = {
|
||||
"name": 'EnvName',
|
||||
"wrappers": [],
|
||||
"trajectory_generator_kwargs": {
|
||||
'trajectory_generator_type': 'prodmp',
|
||||
},
|
||||
"phase_generator_kwargs": {
|
||||
'phase_generator_type': 'exp',
|
||||
},
|
||||
"controller_kwargs": {
|
||||
'controller_type': 'motor',
|
||||
"p_gains": 1.0,
|
||||
"d_gains": 0.1,
|
||||
},
|
||||
"basis_generator_kwargs": {
|
||||
'basis_generator_type': 'prodmp',
|
||||
'alpha': 10,
|
||||
'num_basis': 5,
|
||||
},
|
||||
"black_box_kwargs": {
|
||||
}
|
||||
}
|
||||
|
||||
# Classic Control
|
||||
## Simple Reacher
|
||||
register(
|
||||
@ -197,6 +223,14 @@ register(
|
||||
max_episode_steps=MAX_EPISODE_STEPS_BEERPONG,
|
||||
)
|
||||
|
||||
# Box pushing environments with different rewards
|
||||
for reward_type in ["Dense", "TemporalSparse", "TemporalSpatialSparse"]:
|
||||
register(
|
||||
id='BoxPushing{}-v0'.format(reward_type),
|
||||
entry_point='fancy_gym.envs.mujoco:BoxPushing{}'.format(reward_type),
|
||||
max_episode_steps=MAX_EPISODE_STEPS_BOX_PUSHING,
|
||||
)
|
||||
|
||||
# Here we use the same reward as in BeerPong-v0, but now consider after the release,
|
||||
# only one time step, i.e. we simulate until the end of th episode
|
||||
register(
|
||||
@ -325,7 +359,6 @@ for _v in _versions:
|
||||
kwargs=kwargs_dict_reacher_promp
|
||||
)
|
||||
ALL_FANCY_MOVEMENT_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)
|
||||
|
||||
########################################################################################################################
|
||||
## Beerpong ProMP
|
||||
_versions = ['BeerPong-v0']
|
||||
@ -430,7 +463,50 @@ for _v in _versions:
|
||||
ALL_FANCY_MOVEMENT_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)
|
||||
|
||||
# ########################################################################################################################
|
||||
#
|
||||
|
||||
## Box Pushing
|
||||
_versions = ['BoxPushingDense-v0', 'BoxPushingTemporalSparse-v0', 'BoxPushingTemporalSpatialSparse-v0']
|
||||
for _v in _versions:
|
||||
_name = _v.split("-")
|
||||
_env_id = f'{_name[0]}ProMP-{_name[1]}'
|
||||
kwargs_dict_box_pushing_promp = deepcopy(DEFAULT_BB_DICT_ProMP)
|
||||
kwargs_dict_box_pushing_promp['wrappers'].append(mujoco.box_pushing.MPWrapper)
|
||||
kwargs_dict_box_pushing_promp['name'] = _v
|
||||
kwargs_dict_box_pushing_promp['controller_kwargs']['p_gains'] = 0.01 * np.array([120., 120., 120., 120., 50., 30., 10.])
|
||||
kwargs_dict_box_pushing_promp['controller_kwargs']['d_gains'] = 0.01 * np.array([10., 10., 10., 10., 6., 5., 3.])
|
||||
kwargs_dict_box_pushing_promp['basis_generator_kwargs']['basis_bandwidth_factor'] = 2 # 3.5, 4 to try
|
||||
|
||||
register(
|
||||
id=_env_id,
|
||||
entry_point='fancy_gym.utils.make_env_helpers:make_bb_env_helper',
|
||||
kwargs=kwargs_dict_box_pushing_promp
|
||||
)
|
||||
ALL_FANCY_MOVEMENT_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)
|
||||
|
||||
for _v in _versions:
|
||||
_name = _v.split("-")
|
||||
_env_id = f'{_name[0]}ReplanProDMP-{_name[1]}'
|
||||
kwargs_dict_box_pushing_prodmp = deepcopy(DEFAULT_BB_DICT_ProDMP)
|
||||
kwargs_dict_box_pushing_prodmp['wrappers'].append(mujoco.box_pushing.MPWrapper)
|
||||
kwargs_dict_box_pushing_prodmp['name'] = _v
|
||||
kwargs_dict_box_pushing_prodmp['controller_kwargs']['p_gains'] = 0.01 * np.array([120., 120., 120., 120., 50., 30., 10.])
|
||||
kwargs_dict_box_pushing_prodmp['controller_kwargs']['d_gains'] = 0.01 * np.array([10., 10., 10., 10., 6., 5., 3.])
|
||||
kwargs_dict_box_pushing_prodmp['trajectory_generator_kwargs']['weights_scale'] = 0.3
|
||||
kwargs_dict_box_pushing_prodmp['trajectory_generator_kwargs']['goal_scale'] = 0.3
|
||||
kwargs_dict_box_pushing_prodmp['trajectory_generator_kwargs']['auto_scale_basis'] = True
|
||||
kwargs_dict_box_pushing_prodmp['trajectory_generator_kwargs']['goal_offset'] = 1.0
|
||||
kwargs_dict_box_pushing_prodmp['basis_generator_kwargs']['num_basis'] = 4
|
||||
kwargs_dict_box_pushing_prodmp['basis_generator_kwargs']['basis_bandwidth_factor'] = 3
|
||||
kwargs_dict_box_pushing_prodmp['phase_generator_kwargs']['alpha_phase'] = 3
|
||||
kwargs_dict_box_pushing_prodmp['black_box_kwargs']['max_planning_times'] = 4
|
||||
kwargs_dict_box_pushing_prodmp['black_box_kwargs']['replanning_schedule'] = lambda pos, vel, obs, action, t : t % 25 == 0
|
||||
kwargs_dict_box_pushing_prodmp['black_box_kwargs']['condition_on_desired'] = True
|
||||
register(
|
||||
id=_env_id,
|
||||
entry_point='fancy_gym.utils.make_env_helpers:make_bb_env_helper',
|
||||
kwargs=kwargs_dict_box_pushing_prodmp
|
||||
)
|
||||
ALL_FANCY_MOVEMENT_PRIMITIVE_ENVIRONMENTS["ProDMP"].append(_env_id)
|
||||
#
|
||||
# ## Walker2DJump
|
||||
# _versions = ['Walker2DJump-v0']
|
||||
|
@ -7,3 +7,4 @@ from .hopper_throw.hopper_throw import HopperThrowEnv
|
||||
from .hopper_throw.hopper_throw_in_basket import HopperThrowInBasketEnv
|
||||
from .reacher.reacher import ReacherEnv
|
||||
from .walker_2d_jump.walker_2d_jump import Walker2dJumpEnv
|
||||
from .box_pushing.box_pushing_env import BoxPushingDense, BoxPushingTemporalSparse, BoxPushingTemporalSpatialSparse
|
||||
|
1
fancy_gym/envs/mujoco/box_pushing/__init__.py
Normal file
1
fancy_gym/envs/mujoco/box_pushing/__init__.py
Normal file
@ -0,0 +1 @@
|
||||
from .mp_wrapper import MPWrapper
|
42
fancy_gym/envs/mujoco/box_pushing/assets/box_pushing.xml
Normal file
42
fancy_gym/envs/mujoco/box_pushing/assets/box_pushing.xml
Normal file
@ -0,0 +1,42 @@
|
||||
<mujoco model="base_surrounding">
|
||||
<compiler angle="radian" discardvisual="false" />
|
||||
<option collision="all" cone="elliptic" gravity="0 0 -9.81" impratio="3" solver="Newton" timestep="0.002" tolerance="1e-10" />
|
||||
<size nconmax="2000" njmax="2000" />
|
||||
<asset>
|
||||
<texture builtin="gradient" height="32" rgb1="0.26 0.58 0.51" rgb2="0.26 0.58 0.51" type="skybox" width="32" />
|
||||
</asset>
|
||||
<visual>
|
||||
<map zfar="1000" znear="0.001" />
|
||||
</visual>
|
||||
<worldbody>
|
||||
<light castshadow="true" cutoff="100" diffuse="1 1 1" dir="-0 0 -1.3" directional="true" exponent="1" pos="0 0 1.3" specular=".1 .1 .1" />
|
||||
<body name="ground" pos="0 0 -0.94">
|
||||
<geom name="ground:geom1" rgba="0.26 0.58 0.51 1" size="0 0 1" type="plane" />
|
||||
</body>
|
||||
<!-- <body name="goal" pos="0.5 0 0.2" quat="1 0 0 0">-->
|
||||
<!-- <geom type="sphere" mass="0.1" size="0.01" rgba="1 0 0 1" />-->
|
||||
<!-- </body>-->
|
||||
<!-- <body name="box" pos="0.5 0 0.1" quat="1 0 0 0">-->
|
||||
<!-- <geom type="box" mass="1" size="0.02 0.02 0.02" rgba="0.32 0.32 0.32 1" />-->
|
||||
<!-- </body>-->
|
||||
<body name="target_pos" pos="0.5 0.5 0.0">
|
||||
<site type="box" pos="0 0 0" rgba="0 1 0 0.3" size="0.05 0.05 0.01" />
|
||||
<site pos="0.05 0 0.0485" size="0.005 0.05 0.045" rgba="0 0 1 0.5" type="box"/>
|
||||
<site pos="0 0.05 0.0485" size="0.05 0.005 0.045" rgba="0 1 0 0.5" type="box"/>
|
||||
<site pos="-0.05 0 0.0485" size="0.005 0.05 0.045" rgba="0 1 0 0.5" type="box"/>
|
||||
<site pos="0 -0.05 0.0485" size="0.05 0.005 0.045" rgba="0 1 0 0.5" type="box"/>
|
||||
</body>
|
||||
|
||||
<body name="replan_target_pos" pos="0.5 0.5 -0.01">
|
||||
<site type="box" pos="0 0 0" rgba="1 1 0 0.3" size="0.05 0.05 0.01" />
|
||||
<site pos="0.05 0 0.0485" size="0.005 0.05 0.045" rgba="0 0 1 0.5" type="box"/>
|
||||
<site pos="0 0.05 0.0485" size="0.05 0.005 0.045" rgba="1 1 0 0.5" type="box"/>
|
||||
<site pos="-0.05 0 0.0485" size="0.005 0.05 0.045" rgba="1 1 0 0.5" type="box"/>
|
||||
<site pos="0 -0.05 0.0485" size="0.05 0.005 0.045" rgba="1 1 0 0.5" type="box"/>
|
||||
</body>
|
||||
</worldbody>
|
||||
|
||||
<include file="kit_lab_surrounding.xml" />
|
||||
<include file="panda_rod.xml" />
|
||||
<include file="push_box.xml" />
|
||||
</mujoco>
|
118
fancy_gym/envs/mujoco/box_pushing/assets/kit_lab_surrounding.xml
Normal file
118
fancy_gym/envs/mujoco/box_pushing/assets/kit_lab_surrounding.xml
Normal file
@ -0,0 +1,118 @@
|
||||
<mujoco model="PandaFrame">
|
||||
<worldbody>
|
||||
<body name="table_plane" pos="0.2 0 -0.02">
|
||||
<geom type="box" size="0.49 0.98 0.001" rgba="0.8 0.655 0.45 1" solimp="0.999 0.999 0.001"
|
||||
solref="0.002 1"/>
|
||||
|
||||
<body name="panda_ground" pos="-0.24 0 0.01">
|
||||
<geom type="box" size="0.18 0.18 0.01" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
|
||||
<body name="front_upper" pos="0.49 0 -0.02">
|
||||
<geom type="box" size="0.02 0.96 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="front_mid" pos="0.49 0 -0.445">
|
||||
<geom type="box" size="0.02 0.96 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="front_lower" pos="0.49 0 -0.87">
|
||||
<geom type="box" size="0.02 0.96 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
|
||||
<body name="back_upper" pos="-0.49 0 -0.02">
|
||||
<geom type="box" size="0.02 0.96 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="back_mid" pos="-0.49 0 -0.445">
|
||||
<geom type="box" size="0.02 0.96 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="back_lower" pos="-0.49 0 -0.87">
|
||||
<geom type="box" size="0.02 0.96 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
|
||||
<body name="vert_front_left" pos="0.49 0.98 -0.445">
|
||||
<geom type="box" size="0.02 0.02 0.445" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="vert_front_right" pos="0.49 -0.98 -0.445">
|
||||
<geom type="box" size="0.02 0.02 0.445" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="vert_back_left" pos="-0.49 0.98 -0.445">
|
||||
<geom type="box" size="0.02 0.02 0.445" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="vert_back_right" pos="-0.49 -0.98 -0.445">
|
||||
<geom type="box" size="0.02 0.02 0.445" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
|
||||
<body name="side_upper_right" pos="0 -0.98 -0.02">
|
||||
<geom type="box" size="0.47 0.02 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="side_lower_right" pos="0 -0.98 -0.87">
|
||||
<geom type="box" size="0.47 0.02 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
|
||||
<body name="side_upper_left" pos="0 0.98 -0.02">
|
||||
<geom type="box" size="0.47 0.02 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="side_lower_left" pos="0 0.98 -0.87">
|
||||
<geom type="box" size="0.47 0.02 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
|
||||
<body name="foot_front_left" pos="0.49 0.98 -0.9">
|
||||
<geom type="cylinder" size="0.02 0.02 0.04" rgba="0 0 0 1"/>
|
||||
</body>
|
||||
<body name="foot_front_mid" pos="0.49 0 -0.9">
|
||||
<geom type="cylinder" size="0.02 0.02 0.04" rgba="0 0 0 1"/>
|
||||
</body>
|
||||
<body name="foot_front_right" pos="0.49 -0.98 -0.9">
|
||||
<geom type="cylinder" size="0.02 0.02 0.04" rgba="0 0 0 1"/>
|
||||
</body>
|
||||
|
||||
<body name="foot_back_left" pos="-0.49 0.98 -0.9">
|
||||
<geom type="cylinder" size="0.02 0.02 0.04" rgba="0 0 0 1"/>
|
||||
</body>
|
||||
<body name="foot_back_mid" pos="-0.49 0 -0.9">
|
||||
<geom type="cylinder" size="0.02 0.02 0.04" rgba="0 0 0 1"/>
|
||||
</body>
|
||||
<body name="foot_back_right" pos="-0.49 -0.98 -0.9">
|
||||
<geom type="cylinder" size="0.02 0.02 0.04" rgba="0 0 0 1"/>
|
||||
</body>
|
||||
|
||||
<body name="top_back_left" pos="-0.49 0.98 0.65">
|
||||
<geom type="box" size="0.02 0.02 0.65" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="top_back_right" pos="-0.49 -0.98 0.65">
|
||||
<geom type="box" size="0.02 0.02 0.65" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="top_front" pos="0.49 0 1.28">
|
||||
<geom type="box" size="0.02 0.96 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="top_back" pos="-0.49 0 1.28">
|
||||
<geom type="box" size="0.02 0.96 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="top_side_right" pos="0 -0.98 1.28">
|
||||
<geom type="box" size="0.51 0.02 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="top_side_mid" pos="0 0 1.28">
|
||||
<geom type="box" size="0.51 0.02 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="top_side_left" pos="0 0.98 1.28">
|
||||
<geom type="box" size="0.51 0.02 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
|
||||
<body name="rot_lower_right" pos="-0.31 0.98 0.22" quat="0.2 0 0.1 0">
|
||||
<geom type="box" size="0.3 0.02 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="rot_lower_left" pos="-0.31 -0.98 0.22" quat="0.2 0 0.1 0">
|
||||
<geom type="box" size="0.3 0.02 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="rot_upper_right" pos="-0.31 0.98 1.04" quat="0.1 0 0.2 0">
|
||||
<geom type="box" size="0.3 0.02 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
<body name="rot_upper_left" pos="-0.31 -0.98 1.04" quat="0.1 0 0.2 0">
|
||||
<geom type="box" size="0.3 0.02 0.02" rgba=".9 .9 .9 1"/>
|
||||
</body>
|
||||
|
||||
<body name="support_body" pos="0 0 -0.4" >
|
||||
<geom type="box" size="0.49 0.98 0.4" rgba="0 0 0 0" solimp="0.999 0.999 0.001" solref="0.002 1"/>
|
||||
</body>
|
||||
</body>
|
||||
</worldbody>
|
||||
</mujoco>
|
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/d435v.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/d435v.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/finger.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/finger.stl
Normal file
Binary file not shown.
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/hand.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/hand.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/handv.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/handv.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link0.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link0.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link0v.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link0v.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link1.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link1.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link1v.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link1v.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link2.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link2.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link2v.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link2v.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link3.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link3.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link3v.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link3v.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link4.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link4.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link4v.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link4v.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link5.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link5.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link5v.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link5v.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link6.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link6.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link6v.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link6v.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link7.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link7.stl
Normal file
Binary file not shown.
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link7v.stl
Normal file
BIN
fancy_gym/envs/mujoco/box_pushing/assets/meshes/panda/link7v.stl
Normal file
Binary file not shown.
159
fancy_gym/envs/mujoco/box_pushing/assets/panda_rod.xml
Normal file
159
fancy_gym/envs/mujoco/box_pushing/assets/panda_rod.xml
Normal file
@ -0,0 +1,159 @@
|
||||
<mujocoinclude>
|
||||
<compiler angle="radian" discardvisual="false" meshdir="./meshes/panda/"/>
|
||||
<asset>
|
||||
<mesh file="link0v.stl" name="link0v"/>
|
||||
<mesh file="link1v.stl" name="link1v"/>
|
||||
<mesh file="link2v.stl" name="link2v"/>
|
||||
<mesh file="link3v.stl" name="link3v"/>
|
||||
<mesh file="link4v.stl" name="link4v"/>
|
||||
<mesh file="link5v.stl" name="link5v"/>
|
||||
<mesh file="link6v.stl" name="link6v"/>
|
||||
<mesh file="link7v.stl" name="link7v"/>
|
||||
<mesh file="handv.stl" name="handv"/>
|
||||
<mesh file="fingerv.stl" name="fingerv"/>
|
||||
</asset>
|
||||
<contact>
|
||||
<exclude body1="panda_link0" body2="panda_link1"/>
|
||||
<exclude body1="panda_link1" body2="panda_link2"/>
|
||||
<exclude body1="panda_link2" body2="panda_link3"/>
|
||||
<exclude body1="panda_link3" body2="panda_link4"/>
|
||||
<exclude body1="panda_link4" body2="panda_link5"/>
|
||||
<exclude body1="panda_link5" body2="panda_link6"/>
|
||||
<exclude body1="panda_link6" body2="panda_link7"/>
|
||||
<exclude body1="panda_link7" body2="panda_link8"/>
|
||||
<exclude body1="panda_link8" body2="panda_hand"/>
|
||||
</contact>
|
||||
<worldbody>
|
||||
<body name="panda_link0" pos="0 0 0">
|
||||
<inertial diaginertia="0.0126801 0.0117603 0.00856656" mass="3.01399" pos="-0.0291898 -0.000879465 0.0566032"
|
||||
quat="0.00411744 0.564916 0.0132875 0.825031"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link0v" name="panda_link0:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link0v" name="panda_link0:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link1" pos="0 0 0.333">
|
||||
<inertial diaginertia="0.0164224 0.0153969 0.00546286" mass="2.77281" pos="1.1399e-05 -0.0312655 -0.0693733"
|
||||
quat="0.98466 0.174481 -0.000101815 0.000347662"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint1" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link1v" name="panda_joint1:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link1v" name="panda_joint1:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link2" pos="0 0 0" quat="0.707107 -0.707107 0 0">
|
||||
<inertial diaginertia="0.016787 0.0157415 0.00553027" mass="2.7996" pos="-1.31766e-05 -0.0703216 0.0311782"
|
||||
quat="0.57484 0.818266 -6.05764e-05 -6.61626e-05"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint2" pos="0 0 0" range="-1.8326
|
||||
1.8326"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link2v" name="panda_joint2:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link2v" name="panda_joint2:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link3" pos="0 -0.316 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00915257 0.00896477 0.00384742" mass="2.14603" pos="0.0443483 0.0249283 -0.03813"
|
||||
quat="0.0615263 0.349824 0.234291 0.904956"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint3" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link3v" name="panda_joint3:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link3v" name="panda_joint3:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link4" pos="0.0825 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00946899 0.00928491 0.00396694" mass="2.18807" pos="-0.0385503 0.0395256 0.0247162"
|
||||
quat="0.813566 0.465041 0.309792 0.160858"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint4" pos="0 0 0" range="-3.1416 0.0873"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link4v" name="panda_link4:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link4v" name="panda_link4:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link5" pos="-0.0825 0.384 0" quat="0.707107 -0.707107 0 0">
|
||||
<inertial diaginertia="0.0278873 0.0268823 0.00569569" mass="3.19545" pos="-6.36776e-05 0.0384124 -0.10997"
|
||||
quat="0.990767 -0.135571 0.000963106 0.000694406"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint5" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link5v" name="panda_link5:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link5v" name="panda_link5:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link6" pos="0 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00412168 0.0033698 0.00213304" mass="1.35761" pos="0.0510023 0.00693267 0.00616899"
|
||||
quat="-0.0460841 0.754362 0.044494 0.653325"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint6" pos="0 0 0" range="-0.0873 3.8223"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link6v" name="panda_link6:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link6v" name="panda_link6:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link7" pos="0.088 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.000637671 0.000528056 0.000279577" mass="0.417345"
|
||||
pos="0.0103614 0.0103596 0.0791078" quat="0.63547 0.278021 -0.670462 0.263369"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint7" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link7v" name="panda_link7:geom1" rgba="1 1 1 1"
|
||||
type="mesh"/>
|
||||
<geom mesh="link7v" name="panda_link7:geom2" rgba="1 1 1 1" solimp="1.998 1.999 0" type="mesh"/>
|
||||
<body name="panda_link8" pos="0 0 0.107">
|
||||
<inertial diaginertia="0.1 0.1 0.1" mass="0.1" pos="0 0 0"/>
|
||||
<body name="panda_hand" pos="0 0 0" quat="0.92388 0 0 -0.382683">
|
||||
<inertial diaginertia="0.00227632 0.00206087 0.000456542" mass="0.670782"
|
||||
pos="-2.76618e-06 -0.00061547 0.0239295" quat="0.697945 0.716151 -0.000242485 8.47563e-05"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="handv" name="panda_hand:geom1" type="mesh"/>
|
||||
<geom mesh="handv" name="panda_hand:geom2" solimp="1.998 1.999 0" type="mesh"/>
|
||||
<camera euler="0 3.14 0" fovy="60" ipd="0.0" mode="fixed" name="rgbd" pos="0.1 0.0 0."/>
|
||||
<body name="tcp" pos="0 0 0.105">
|
||||
<site name="tcp" rgba='0 0 1 0' size='0.001'/>
|
||||
</body>
|
||||
|
||||
<!-- PUSHROD -->
|
||||
<body name="push_rod">
|
||||
<geom type="cylinder" size="0.01 0.15" pos="0 0 0.075"/>
|
||||
<site name="rod_tip" type="box" rgba="0 0 1 1." size="0.01 0.01 0.01" pos="0 0 0.2"/>
|
||||
</body>
|
||||
|
||||
<body childclass="panda:gripper" name="panda_leftfinger" pos="0 0 0.0584">
|
||||
<inertial diaginertia="5.69661e-06 5.56035e-06 1.55183e-06" mass="0.0218754"
|
||||
pos="-2.42335e-05 0.0119585 0.0237816" quat="0.996177 0.0868631 -2.79377e-05 -0.00926642"/>
|
||||
<joint axis="0 1 0" name="panda_finger_joint1"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="fingerv" name="panda_leftfinger:geom1" type="mesh"/>
|
||||
<geom mesh="fingerv" name="panda_leftfinger:geom2" type="mesh"/>
|
||||
<site name="panda_leftfinger:site" pos="0 0.012 0.045" rgba="0 0 1 0" size="0.012 0.015 0.012" type="box"/>
|
||||
<body name="finger_joint1_tip" pos="0 0.0085 0.056">
|
||||
<inertial diaginertia="0.01 0.01 0.01" mass="0.01" pos="0 0 0" quat="0 0 0 1"/>
|
||||
<geom conaffinity="1" condim="4" contype="1" friction="2 0.05 0.0001" name="finger1_tip_collision"
|
||||
pos="0 -0.005 -0.012" quat="0 0 0 1" rgba="1 0 0 1" size="0.008 0.004 0.008" solref="0.01 0.5"
|
||||
type="box"/>
|
||||
</body>
|
||||
</body>
|
||||
<body childclass="panda:gripper" name="panda_rightfinger" pos="0 0 0.0584">
|
||||
<inertial diaginertia="5.69661e-06 5.56035e-06 1.55183e-06" mass="0.0218754"
|
||||
pos="2.42335e-05 -0.0119585 0.0237816" quat="0.996177 -0.0868631 2.79377e-05 -0.00926642"/>
|
||||
<joint axis="0 -1 0" name="panda_finger_joint2"/>
|
||||
<site name="panda_rightfinger:site" pos="0 -0.012 0.045" rgba="0 0 1 0" size="0.012 0.015 0.012"
|
||||
type="box"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="fingerv" name="panda_rightfinger:geom1" quat="0 0 0 1"
|
||||
type="mesh"/>
|
||||
<geom condim="4" mesh="fingerv" name="panda_rightfinger:geom2" quat="0 0 0 1" type="mesh"/>
|
||||
<body name="finger_joint2_tip" pos="0 -0.0085 0.056">
|
||||
<inertial diaginertia="0.01 0.01 0.01" mass="0.01" pos="0 0 0" quat="0 0 0 1"/>
|
||||
<geom conaffinity="1" condim="4" contype="1" friction="2 0.05 0.0001" name="finger2_tip_collision"
|
||||
pos="0 0.005 -0.012" quat="0 0 0 1" rgba="1 0 0 1" size="0.008 0.004 0.008" solref="0.01 0.5"
|
||||
type="box"/>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
<camera euler="0 0 0" fovy="45" ipd="0.0" mode="fixed" name="rgbd_cage" pos="0.7 0.1 0.9"/>
|
||||
</worldbody>
|
||||
<sensor>
|
||||
<touch name="touchsensor:left" site="panda_leftfinger:site"/>
|
||||
<touch name="touchsensor:right" site="panda_rightfinger:site"/>
|
||||
</sensor>
|
||||
<default>
|
||||
<default class="panda:gripper">
|
||||
<geom condim="4" friction="1 0.005 0.0001" margin="0.001" solimp="0.998 0.999 0.001" solref="0.02 1" type="box"/>
|
||||
<joint damping="10" limited="true" range="0 0.04" type="slide"/>
|
||||
</default>
|
||||
</default>
|
||||
<actuator>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint1" name="panda_joint1_act"/>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint2" name="panda_joint2_act"/>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint3" name="panda_joint3_act"/>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint4" name="panda_joint4_act"/>
|
||||
<motor forcelimited="true" forcerange="-12 12" joint="panda_joint5" name="panda_joint5_act"/>
|
||||
<motor forcelimited="true" forcerange="-12 12" joint="panda_joint6" name="panda_joint6_act"/>
|
||||
<motor forcelimited="true" forcerange="-12 12" joint="panda_joint7" name="panda_joint7_act"/>
|
||||
<!-- <position ctrllimited="true" ctrlrange="0.001 0.04" forcelimited="true" forcerange="-70 70"-->
|
||||
<!-- joint="panda_finger_joint1" kp="1000000" name="panda_finger_joint1_act"/>-->
|
||||
<!-- <position ctrllimited="true" ctrlrange="0.001 0.04" forcelimited="true" forcerange="-70 70"-->
|
||||
<!-- joint="panda_finger_joint2" kp="1000000" name="panda_finger_joint2_act"/>-->
|
||||
</actuator>
|
||||
</mujocoinclude>
|
12
fancy_gym/envs/mujoco/box_pushing/assets/push_box.xml
Normal file
12
fancy_gym/envs/mujoco/box_pushing/assets/push_box.xml
Normal file
@ -0,0 +1,12 @@
|
||||
<mujoco model="push_box">
|
||||
<worldbody>
|
||||
<body name="box_0" pos="0.6 0.15 0.0" quat="1 0 0 0">
|
||||
<geom pos="0 0 0" size="0.05 0.05 0.01" rgba="1 0 0 1.0" type="box" mass="2.0" friction="0.3 0.001 0.0001" priority="1"/>
|
||||
<geom pos="0.05 0 0.0485" size="0.005 0.05 0.045" rgba="0 0 1 1.0" type="box" mass="0.001"/>
|
||||
<geom pos="0 0.05 0.0485" size="0.05 0.005 0.045" rgba="1 0 0 1.0" type="box" mass="0.001"/>
|
||||
<geom pos="-0.05 0 0.0485" size="0.005 0.05 0.045" rgba="1 0 0 1.0" type="box" mass="0.001"/>
|
||||
<geom pos="0 -0.05 0.0485" size="0.05 0.005 0.045" rgba="1 0 0 1.0" type="box" mass="0.001"/>
|
||||
<joint name="box_joint" type="free"/>
|
||||
</body>
|
||||
</worldbody>
|
||||
</mujoco>
|
@ -0,0 +1,15 @@
|
||||
<mujocoinclude>
|
||||
<worldbody>
|
||||
<body mocap="true" name="panda:mocap" pos="0 0 0">
|
||||
<geom conaffinity="0" contype="0" pos="0 0 0" rgba="0 0.5 0 0.7" size="0.005 0.005 0.005" type="box" />
|
||||
<!-- <geom conaffinity="0" contype="0" pos="0 0 0" rgba="1 0 0 0.3" size="1 0.005 0.005" type="box" />-->
|
||||
<!-- <geom conaffinity="0" contype="0" pos="0 0 0" rgba="0 1 0 0.3" size="0.005 1 0.005" type="box" />-->
|
||||
<!-- <geom conaffinity="0" contype="0" pos="0 0 0" rgba="0 0 1 0.3" size="0.005 0.005 1" type="box" />-->
|
||||
</body>
|
||||
</worldbody>
|
||||
<equality>
|
||||
<weld body1="panda:mocap" body2="tcp" solref="0.001 1"/>
|
||||
</equality>
|
||||
</mujocoinclude>
|
||||
|
||||
|
@ -0,0 +1,50 @@
|
||||
<mujocoinclude>
|
||||
<actuator>
|
||||
<position class="panda" ctrlrange="-2.9671 2.9671" forcerange="-87 87" joint="panda_joint1" kp="8700.0"
|
||||
name="panda_joint1"/>
|
||||
<position class="panda" ctrlrange="-1.8326 1.8326" forcerange="-87 87" joint="panda_joint2" kp="8700.0"
|
||||
name="panda_joint2"/>
|
||||
<position class="panda" ctrlrange="-2.9671 2.9671" forcerange="-87 87" joint="panda_joint3" kp="8700.0"
|
||||
name="panda_joint3"/>
|
||||
<position class="panda" ctrlrange="-3.1416 0.0" forcerange="-87 87" joint="panda_joint4" kp="8700.0"
|
||||
name="panda_joint4"/>
|
||||
<position class="panda" ctrlrange="-2.9671 2.9671" forcerange="-12 12" joint="panda_joint5" kp="1200.0"
|
||||
name="panda_joint5"/>
|
||||
<position class="panda" ctrlrange="-3.7525 2.1817" forcerange="-12 12" joint="panda_joint6" kp="1200.0"
|
||||
name="panda_joint6"/>
|
||||
<position class="panda" ctrlrange="-2.9671 2.9671" forcerange="-12 12" joint="panda_joint7" kp="1200.0"
|
||||
name="panda_joint7"/>
|
||||
</actuator>
|
||||
|
||||
<default>
|
||||
<default class="panda">
|
||||
<joint axis="0 0 1" limited="true" pos="0 0 0"/>
|
||||
<position ctrllimited="true" forcelimited="true" user="1002 40 2001 -0.005 0.005"/>
|
||||
<default class="panda_viz">
|
||||
<geom conaffinity="0" contype="0" group="0" mass="0" rgba=".95 .99 .92 1" type="mesh"/>
|
||||
</default>
|
||||
|
||||
<default class="panda_col">
|
||||
<geom conaffinity="1" contype="1" group="3" rgba=".5 .6 .7 1" type="mesh"/>
|
||||
</default>
|
||||
<default class="panda_arm">
|
||||
<joint damping="100"/>
|
||||
</default>
|
||||
<default class="panda_forearm">
|
||||
<joint damping="10"/>
|
||||
</default>
|
||||
<default class="panda_finger">
|
||||
<joint armature="5" damping="100"/>
|
||||
<geom conaffinity="0" condim="6" contype="1" friction="1 0.5 0.0001" group="3" margin="0.001" rgba="0.5 0.6 0.7 .4"
|
||||
solimp="0.8 0.9 0.001" solref="0.01 1" user="0"/>
|
||||
<position user="1002 40 2001 -0.0001 0.0001"/>
|
||||
</default>
|
||||
</default>
|
||||
|
||||
<default class="panda_overlay">
|
||||
<joint armature="1" damping="1000" frictionloss="10" limited="false"/>
|
||||
<geom conaffinity="0" contype="0" group="2" rgba=".42 0.42 0.42 .5" type="mesh"/>
|
||||
</default>
|
||||
</default>
|
||||
|
||||
</mujocoinclude>
|
@ -0,0 +1,11 @@
|
||||
<mujoco model="torque">
|
||||
<actuator>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint1" name="panda_joint1_act"/>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint2" name="panda_joint2_act"/>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint3" name="panda_joint3_act"/>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint4" name="panda_joint4_act"/>
|
||||
<motor forcelimited="true" forcerange="-12 12" joint="panda_joint5" name="panda_joint5_act"/>
|
||||
<motor forcelimited="true" forcerange="-12 12" joint="panda_joint6" name="panda_joint6_act"/>
|
||||
<motor forcelimited="true" forcerange="-12 12" joint="panda_joint7" name="panda_joint7_act"/>
|
||||
</actuator>
|
||||
</mujoco>
|
@ -0,0 +1,13 @@
|
||||
<mujocoinclude>
|
||||
<actuator>
|
||||
<velocity ctrlrange="-2.1750 2.1750" forcerange="-87 87" joint="panda_joint1" kv="0.8" name="panda_joint1"/>
|
||||
<velocity ctrlrange="-2.1750 2.1750" forcerange="-87 87" joint="panda_joint2" kv="0.8" name="panda_joint2"/>
|
||||
<velocity ctrlrange="-2.1750 2.1750" forcerange="-87 87" joint="panda_joint3" kv="0.8" name="panda_joint3"/>
|
||||
<velocity ctrlrange="-2.1750 2.1750" forcerange="-87 87" joint="panda_joint4" kv="0.8" name="panda_joint4"/>
|
||||
<velocity ctrlrange="-2.6100 2.6100" forcerange="-12 12" joint="panda_joint5" kv="0.8" name="panda_joint5"/>
|
||||
<velocity ctrlrange="-2.6100 2.6100" forcerange="-12 12" joint="panda_joint6" kv="0.8" name="panda_joint6"/>
|
||||
<velocity ctrlrange="-2.9671 2.9671" forcerange="-12 12" joint="panda_joint7" kv="0.8" name="panda_joint7"/>
|
||||
</actuator>
|
||||
|
||||
|
||||
</mujocoinclude>
|
@ -0,0 +1,157 @@
|
||||
<mujoco model="panda">
|
||||
<compiler angle="radian" discardvisual="false" meshdir="../meshes_panda/for_mujoco/"/>
|
||||
<option cone="elliptic" impratio="20" timestep="0.002">
|
||||
</option>
|
||||
<size nconmax="2000" njmax="2000"/>
|
||||
<asset>
|
||||
<mesh file="link0v.stl" name="link0v"/>
|
||||
<mesh file="link1v.stl" name="link1v"/>
|
||||
<mesh file="link2v.stl" name="link2v"/>
|
||||
<mesh file="link3v.stl" name="link3v"/>
|
||||
<mesh file="link4v.stl" name="link4v"/>
|
||||
<mesh file="link5v.stl" name="link5v"/>
|
||||
<mesh file="link6v.stl" name="link6v"/>
|
||||
<mesh file="link7v.stl" name="link7v"/>
|
||||
<mesh file="handv.stl" name="handv"/>
|
||||
<mesh file="fingerv.stl" name="fingerv"/>
|
||||
<texture builtin="gradient" height="32" rgb1="0.26 0.58 0.51" rgb2="0.26 0.58 0.51" type="skybox" width="32"/>
|
||||
</asset>
|
||||
<contact>
|
||||
<exclude body1="panda_link0" body2="panda_link1"/>
|
||||
<exclude body1="panda_link1" body2="panda_link2"/>
|
||||
<exclude body1="panda_link2" body2="panda_link3"/>
|
||||
<exclude body1="panda_link3" body2="panda_link4"/>
|
||||
<exclude body1="panda_link4" body2="panda_link5"/>
|
||||
<exclude body1="panda_link5" body2="panda_link6"/>
|
||||
<exclude body1="panda_link6" body2="panda_link7"/>
|
||||
<exclude body1="panda_link7" body2="panda_link8"/>
|
||||
<exclude body1="panda_link8" body2="panda_hand"/>
|
||||
</contact>
|
||||
<visual>
|
||||
<map zfar="1000" znear="0.001"/>
|
||||
</visual>
|
||||
<worldbody>
|
||||
<light castshadow="false" cutoff="100" diffuse="1 1 1" dir="-0 0 -1.3" directional="true" exponent="1" pos="0 0 1.3"
|
||||
specular=".1 .1 .1"/>
|
||||
<body name="ground" pos="0 0 -0.94">
|
||||
<geom name="ground:geom1" rgba="0.26 0.58 0.51 1" size="0 0 1" type="plane"/>
|
||||
</body>
|
||||
<body name="panda_link0" pos="0 0 0">
|
||||
<inertial diaginertia="0.0126801 0.0117603 0.00856656" mass="3.01399" pos="-0.0291898 -0.000879465 0.0566032"
|
||||
quat="0.00411744 0.564916 0.0132875 0.825031"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link0v" name="panda_link0:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link0v" name="panda_link0:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body childclass="panda:body" name="panda_link1" pos="0 0 0.333">
|
||||
<inertial diaginertia="0.0164224 0.0153969 0.00546286" mass="2.77281" pos="1.1399e-05 -0.0312655 -0.0693733"
|
||||
quat="0.98466 0.174481 -0.000101815 0.000347662"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint1" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link1v" name="panda_joint1:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link1v" name="panda_joint1:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body childclass="panda:body" name="panda_link2" pos="0 0 0" quat="0.707107 -0.707107 0 0">
|
||||
<inertial diaginertia="0.016787 0.0157415 0.00553027" mass="2.7996" pos="-1.31766e-05 -0.0703216 0.0311782"
|
||||
quat="0.57484 0.818266 -6.05764e-05 -6.61626e-05"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint2" pos="0 0 0"
|
||||
range="-1.8326 1.8326"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link2v" name="panda_joint2:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link2v" name="panda_joint2:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body childclass="panda:body" name="panda_link3" pos="0 -0.316 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00915257 0.00896477 0.00384742" mass="2.14603" pos="0.0443483 0.0249283 -0.03813"
|
||||
quat="0.0615263 0.349824 0.234291 0.904956"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint3" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link3v" name="panda_joint3:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link3v" name="panda_joint3:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body childclass="panda:body" name="panda_link4" pos="0.0825 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00946899 0.00928491 0.00396694" mass="2.18807" pos="-0.0385503 0.0395256 0.0247162"
|
||||
quat="0.813566 0.465041 0.309792 0.160858"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint4" pos="0 0 0" range="-3.1416 0.0873"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link4v" name="panda_link4:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link4v" name="panda_link4:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body childclass="panda:body" name="panda_link5" pos="-0.0825 0.384 0" quat="0.707107 -0.707107 0 0">
|
||||
<inertial diaginertia="0.0278873 0.0268823 0.00569569" mass="3.19545" pos="-6.36776e-05 0.0384124 -0.10997"
|
||||
quat="0.990767 -0.135571 0.000963106 0.000694406"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint5" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link5v" name="panda_link5:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link5v" name="panda_link5:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body childclass="panda:body" name="panda_link6" pos="0 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00412168 0.0033698 0.00213304" mass="1.35761" pos="0.0510023 0.00693267 0.00616899"
|
||||
quat="-0.0460841 0.754362 0.044494 0.653325"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint6" pos="0 0 0" range="-0.0873 3.8223"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link6v" name="panda_link6:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link6v" name="panda_link6:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body childclass="panda:body" name="panda_link7" pos="0.088 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.000637671 0.000528056 0.000279577" mass="0.417345"
|
||||
pos="0.0103614 0.0103596 0.0791078" quat="0.63547 0.278021 -0.670462 0.263369"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint7" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link7v" name="panda_link7:geom1" rgba="1 1 1 1"
|
||||
type="mesh"/>
|
||||
<geom mesh="link7v" name="panda_link7:geom2" rgba="1 1 1 1" solimp="1.998 1.999 0" type="mesh"/>
|
||||
<body name="panda_link8" pos="0 0 0.107">
|
||||
<inertial diaginertia="0.1 0.1 0.1" mass="0.1" pos="0 0 0"/>
|
||||
<body name="panda_hand" pos="0 0 0" quat="0.92388 0 0 -0.382683">
|
||||
<inertial diaginertia="0.00227632 0.00206087 0.000456542" mass="0.670782"
|
||||
pos="-2.76618e-06 -0.00061547 0.0239295" quat="0.697945 0.716151 -0.000242485 8.47563e-05"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="handv" name="panda_hand:geom1" type="mesh"/>
|
||||
<geom mesh="handv" name="panda_hand:geom2" solimp="1.998 1.999 0" type="mesh"/>
|
||||
<camera euler="0 3.14 0" fovy="60" ipd="0.0" mode="fixed" name="rgbd" pos="0.1 0.0 0."/>
|
||||
<body name="tcp" pos="0 0 0.1">
|
||||
<site name="tcp" rgba="0 0 1 0" size="0.001"/>
|
||||
</body>
|
||||
<body childclass="panda:gripper" name="panda_leftfinger" pos="0 0 0.0584">
|
||||
<inertial diaginertia="5.69661e-06 5.56035e-06 1.55183e-06" mass="0.0218754" pos="-2.42335e-05 0.0119585 0.0237816" quat="0.996177 0.0868631 -2.79377e-05 -0.00926642" />
|
||||
<joint axis="0 1 0" name="panda_finger_joint1" />
|
||||
<site name="panda_leftfinger:site" pos="0 0.012 0.045" rgba="0 0 1 0" size="0.012 0.015 0.012" type="box" />
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="fingerv" name="panda_leftfinger:geom1" type="mesh" />
|
||||
<geom mesh="fingerv" name="panda_leftfinger:geom2" type="mesh" />
|
||||
<body name="finger_joint1_tip" pos="0 0.0085 0.056">
|
||||
<inertial diaginertia="0.01 0.01 0.01" mass="0.01" pos="0 0 0" quat="0 0 0 1" />
|
||||
<geom conaffinity="1" condim="4" contype="1" friction="2 0.05 0.0001" name="finger1_tip_collision" pos="0 -0.005 -0.012" quat="0 0 0 1" rgba="1 0 0 1" size="0.008 0.004 0.008" solref="0.01 0.5" type="box" />
|
||||
<geom conaffinity="1" contype="1" name="touch_left" rgba="0 1 0 1" pos="0 -0.005 -0.012"
|
||||
quat="1 1 0 0" size="0.004 0.004" type="cylinder"/>
|
||||
</body>
|
||||
</body>
|
||||
<body childclass="panda:gripper" name="panda_rightfinger" pos="0 0 0.0584">
|
||||
<inertial diaginertia="5.69661e-06 5.56035e-06 1.55183e-06" mass="0.0218754" pos="2.42335e-05 -0.0119585 0.0237816" quat="0.996177 -0.0868631 2.79377e-05 -0.00926642" />
|
||||
<joint axis="0 -1 0" name="panda_finger_joint2" />
|
||||
<site name="panda_rightfinger:site" pos="0 -0.012 0.045" rgba="0 0 1 0" size="0.012 0.015 0.012" type="box" />
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="fingerv" name="panda_rightfinger:geom1" quat="0 0 0 1" type="mesh" />
|
||||
<geom mesh="fingerv" name="panda_rightfinger:geom2" quat="0 0 0 1" type="mesh" />
|
||||
<body name="finger_joint2_tip" pos="0 -0.0085 0.056">
|
||||
<inertial diaginertia="0.01 0.01 0.01" mass="0.01" pos="0 0 0" quat="0 0 0 1" />
|
||||
<geom conaffinity="1" condim="4" contype="1" friction="2 0.05 0.0001" name="finger2_tip_collision" pos="0 0.005 -0.012" quat="0 0 0 1" rgba="1 0 0 1" size="0.008 0.004 0.008" solref="0.01 0.5" type="box" />
|
||||
<geom conaffinity="1" contype="1" name="touch_right" rgba="0 1 0 1" pos="0 0.005 -0.012"
|
||||
quat="1 1 0 0" size="0.004 0.004" type="cylinder"/>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
<camera euler="0 0 0" fovy="45" ipd="0.0" mode="fixed" name="rgbd_cage" pos="0.7 0.1 0.9"/>
|
||||
</worldbody>
|
||||
<sensor>
|
||||
<touch name="touchsensor:left" site="panda_leftfinger:site"/>
|
||||
<touch name="touchsensor:right" site="panda_rightfinger:site"/>
|
||||
</sensor>
|
||||
<default>
|
||||
<default class="panda:body">
|
||||
<joint damping="0" />
|
||||
</default>
|
||||
<default class="panda:gripper">
|
||||
<geom condim="4" solimp="0.999 0.999 0.0001" type="box"/>
|
||||
<joint armature="10" damping="300" limited="true" range="0.001 0.04" type="slide"/>
|
||||
</default>
|
||||
</default>
|
||||
<actuator>
|
||||
<position ctrllimited="true" ctrlrange="0.001 0.04" forcelimited="true" forcerange="-70 70"
|
||||
joint="panda_finger_joint1" kp="1000000" name="panda_finger_joint1_act"/>
|
||||
<position ctrllimited="true" ctrlrange="0.001 0.04" forcelimited="true" forcerange="-70 70"
|
||||
joint="panda_finger_joint2" kp="1000000" name="panda_finger_joint2_act"/>
|
||||
</actuator>
|
||||
<include file="../assets/panda_frame.xml"/>
|
||||
</mujoco>
|
155
fancy_gym/envs/mujoco/box_pushing/assets/robots/panda.xml
Normal file
155
fancy_gym/envs/mujoco/box_pushing/assets/robots/panda.xml
Normal file
@ -0,0 +1,155 @@
|
||||
<mujocoinclude>
|
||||
<compiler angle="radian" discardvisual="false" meshdir="../robots/meshes/panda/"/>
|
||||
<asset>
|
||||
<mesh file="link0v.stl" name="link0v"/>
|
||||
<mesh file="link1v.stl" name="link1v"/>
|
||||
<mesh file="link2v.stl" name="link2v"/>
|
||||
<mesh file="link3v.stl" name="link3v"/>
|
||||
<mesh file="link4v.stl" name="link4v"/>
|
||||
<mesh file="link5v.stl" name="link5v"/>
|
||||
<mesh file="link6v.stl" name="link6v"/>
|
||||
<mesh file="link7v.stl" name="link7v"/>
|
||||
<mesh file="handv.stl" name="handv"/>
|
||||
<mesh file="fingerv.stl" name="fingerv"/>
|
||||
</asset>
|
||||
<contact>
|
||||
<exclude body1="panda_link0" body2="panda_link1"/>
|
||||
<exclude body1="panda_link1" body2="panda_link2"/>
|
||||
<exclude body1="panda_link2" body2="panda_link3"/>
|
||||
<exclude body1="panda_link3" body2="panda_link4"/>
|
||||
<exclude body1="panda_link4" body2="panda_link5"/>
|
||||
<exclude body1="panda_link5" body2="panda_link6"/>
|
||||
<exclude body1="panda_link6" body2="panda_link7"/>
|
||||
<exclude body1="panda_link7" body2="panda_link8"/>
|
||||
<exclude body1="panda_link8" body2="panda_hand"/>
|
||||
</contact>
|
||||
<worldbody>
|
||||
<body name="panda_link0" pos="0 0 0">
|
||||
<inertial diaginertia="0.0126801 0.0117603 0.00856656" mass="3.01399" pos="-0.0291898 -0.000879465 0.0566032"
|
||||
quat="0.00411744 0.564916 0.0132875 0.825031"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link0v" name="panda_link0:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link0v" name="panda_link0:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link1" pos="0 0 0.333">
|
||||
<inertial diaginertia="0.0164224 0.0153969 0.00546286" mass="2.77281" pos="1.1399e-05 -0.0312655 -0.0693733"
|
||||
quat="0.98466 0.174481 -0.000101815 0.000347662"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint1" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link1v" name="panda_joint1:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link1v" name="panda_joint1:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link2" pos="0 0 0" quat="0.707107 -0.707107 0 0">
|
||||
<inertial diaginertia="0.016787 0.0157415 0.00553027" mass="2.7996" pos="-1.31766e-05 -0.0703216 0.0311782"
|
||||
quat="0.57484 0.818266 -6.05764e-05 -6.61626e-05"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint2" pos="0 0 0" range="-1.8326
|
||||
1.8326"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link2v" name="panda_joint2:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link2v" name="panda_joint2:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link3" pos="0 -0.316 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00915257 0.00896477 0.00384742" mass="2.14603" pos="0.0443483 0.0249283 -0.03813"
|
||||
quat="0.0615263 0.349824 0.234291 0.904956"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint3" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link3v" name="panda_joint3:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link3v" name="panda_joint3:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link4" pos="0.0825 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00946899 0.00928491 0.00396694" mass="2.18807" pos="-0.0385503 0.0395256 0.0247162"
|
||||
quat="0.813566 0.465041 0.309792 0.160858"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint4" pos="0 0 0" range="-3.1416 0.0873"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link4v" name="panda_link4:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link4v" name="panda_link4:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link5" pos="-0.0825 0.384 0" quat="0.707107 -0.707107 0 0">
|
||||
<inertial diaginertia="0.0278873 0.0268823 0.00569569" mass="3.19545" pos="-6.36776e-05 0.0384124 -0.10997"
|
||||
quat="0.990767 -0.135571 0.000963106 0.000694406"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint5" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link5v" name="panda_link5:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link5v" name="panda_link5:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link6" pos="0 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00412168 0.0033698 0.00213304" mass="1.35761" pos="0.0510023 0.00693267 0.00616899"
|
||||
quat="-0.0460841 0.754362 0.044494 0.653325"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint6" pos="0 0 0" range="-0.0873 3.8223"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link6v" name="panda_link6:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link6v" name="panda_link6:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link7" pos="0.088 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.000637671 0.000528056 0.000279577" mass="0.417345"
|
||||
pos="0.0103614 0.0103596 0.0791078" quat="0.63547 0.278021 -0.670462 0.263369"/>
|
||||
<joint axis="0 0 1" limited="true" name="panda_joint7" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link7v" name="panda_link7:geom1" rgba="1 1 1 1"
|
||||
type="mesh"/>
|
||||
<geom mesh="link7v" name="panda_link7:geom2" rgba="1 1 1 1" solimp="1.998 1.999 0" type="mesh"/>
|
||||
<body name="panda_link8" pos="0 0 0.107">
|
||||
<inertial diaginertia="0.1 0.1 0.1" mass="0.1" pos="0 0 0"/>
|
||||
<body name="panda_hand" pos="0 0 0" quat="0.92388 0 0 -0.382683">
|
||||
<inertial diaginertia="0.00227632 0.00206087 0.000456542" mass="0.670782"
|
||||
pos="-2.76618e-06 -0.00061547 0.0239295" quat="0.697945 0.716151 -0.000242485 8.47563e-05"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="handv" name="panda_hand:geom1" type="mesh"/>
|
||||
<geom mesh="handv" name="panda_hand:geom2" solimp="1.998 1.999 0" type="mesh"/>
|
||||
<camera euler="0 3.14 0" fovy="60" ipd="0.0" mode="fixed" name="rgbd" pos="0.1 0.0 0."/>
|
||||
<body name="tcp" pos="0 0 0.105">
|
||||
<site name="tcp" rgba="'0 0 1 0'" size='0.001'/>
|
||||
</body>
|
||||
<body childclass="panda:gripper" name="panda_leftfinger" pos="0 0 0.0584">
|
||||
<inertial diaginertia="5.69661e-06 5.56035e-06 1.55183e-06" mass="0.0218754"
|
||||
pos="-2.42335e-05 0.0119585 0.0237816" quat="0.996177 0.0868631 -2.79377e-05 -0.00926642"/>
|
||||
<joint axis="0 1 0" name="panda_finger_joint1"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="fingerv" name="panda_leftfinger:geom1" type="mesh"/>
|
||||
<geom mesh="fingerv" name="panda_leftfinger:geom2" type="mesh"/>
|
||||
<site name="panda_leftfinger:site" pos="0 0.012 0.045" rgba="0 0 1 0" size="0.012 0.015 0.012" type="box"/>
|
||||
<body name="finger_joint1_tip" pos="0 0.0085 0.056">
|
||||
<inertial diaginertia="0.01 0.01 0.01" mass="0.01" pos="0 0 0" quat="0 0 0 1"/>
|
||||
<geom conaffinity="1" condim="4" contype="1" friction="2 0.05 0.0001" name="finger1_tip_collision"
|
||||
pos="0 -0.005 -0.012" quat="0 0 0 1" rgba="1 0 0 1" size="0.008 0.004 0.008" solref="0.01 0.5"
|
||||
type="box"/>
|
||||
</body>
|
||||
</body>
|
||||
<body childclass="panda:gripper" name="panda_rightfinger" pos="0 0 0.0584">
|
||||
<inertial diaginertia="5.69661e-06 5.56035e-06 1.55183e-06" mass="0.0218754"
|
||||
pos="2.42335e-05 -0.0119585 0.0237816" quat="0.996177 -0.0868631 2.79377e-05 -0.00926642"/>
|
||||
<joint axis="0 -1 0" name="panda_finger_joint2"/>
|
||||
<site name="panda_rightfinger:site" pos="0 -0.012 0.045" rgba="0 0 1 0" size="0.012 0.015 0.012"
|
||||
type="box"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="fingerv" name="panda_rightfinger:geom1" quat="0 0 0 1"
|
||||
type="mesh"/>
|
||||
<geom condim="4" mesh="fingerv" name="panda_rightfinger:geom2" quat="0 0 0 1" type="mesh"/>
|
||||
<body name="finger_joint2_tip" pos="0 -0.0085 0.056">
|
||||
<inertial diaginertia="0.01 0.01 0.01" mass="0.01" pos="0 0 0" quat="0 0 0 1"/>
|
||||
<geom conaffinity="1" condim="4" contype="1" friction="2 0.05 0.0001" name="finger2_tip_collision"
|
||||
pos="0 0.005 -0.012" quat="0 0 0 1" rgba="1 0 0 1" size="0.008 0.004 0.008" solref="0.01 0.5"
|
||||
type="box"/>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
<camera euler="0 0 0" fovy="45" ipd="0.0" mode="fixed" name="rgbd_cage" pos="0.7 0.1 0.9"/>
|
||||
</worldbody>
|
||||
<sensor>
|
||||
<touch name="touchsensor:left" site="panda_leftfinger:site"/>
|
||||
<touch name="touchsensor:right" site="panda_rightfinger:site"/>
|
||||
</sensor>
|
||||
<default>
|
||||
<default class="panda:gripper">
|
||||
<geom condim="4" friction="1 0.005 0.0001" margin="0.001" solimp="0.998 0.999 0.001" solref="0.02 1" type="box"/>
|
||||
<joint damping="10" limited="true" range="0 0.04" type="slide"/>
|
||||
</default>
|
||||
</default>
|
||||
<actuator>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint1" name="panda_joint1_act"/>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint2" name="panda_joint2_act"/>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint3" name="panda_joint3_act"/>
|
||||
<motor forcelimited="true" forcerange="-87 87" joint="panda_joint4" name="panda_joint4_act"/>
|
||||
<motor forcelimited="true" forcerange="-12 12" joint="panda_joint5" name="panda_joint5_act"/>
|
||||
<motor forcelimited="true" forcerange="-12 12" joint="panda_joint6" name="panda_joint6_act"/>
|
||||
<motor forcelimited="true" forcerange="-12 12" joint="panda_joint7" name="panda_joint7_act"/>
|
||||
<motor forcelimited="true" forcerange="-70 70" joint="panda_finger_joint1" name="panda_finger_joint1_act"/>
|
||||
<motor forcelimited="true" forcerange="-70 70" joint="panda_finger_joint2" name="panda_finger_joint2_act"/>
|
||||
<!--<position ctrllimited="true" ctrlrange="0.001 0.04" forcelimited="true" forcerange="-70 70"
|
||||
joint="panda_finger_joint1" kp="1000000" name="panda_finger_joint1_act"/>
|
||||
<position ctrllimited="true" ctrlrange="0.001 0.04" forcelimited="true" forcerange="-70 70"
|
||||
joint="panda_finger_joint2" kp="1000000" name="panda_finger_joint2_act"/>-->
|
||||
|
||||
</actuator>
|
||||
</mujocoinclude>
|
@ -0,0 +1 @@
|
||||
<!--todo-->
|
140
fancy_gym/envs/mujoco/box_pushing/assets/robots/panda_mocap.xml
Normal file
140
fancy_gym/envs/mujoco/box_pushing/assets/robots/panda_mocap.xml
Normal file
@ -0,0 +1,140 @@
|
||||
<mujocoinclude>
|
||||
<compiler angle="radian" discardvisual="false" meshdir="../robots/meshes/panda/"/>
|
||||
<asset>
|
||||
<mesh file="link0v.stl" name="link0v"/>
|
||||
<mesh file="link1v.stl" name="link1v"/>
|
||||
<mesh file="link2v.stl" name="link2v"/>
|
||||
<mesh file="link3v.stl" name="link3v"/>
|
||||
<mesh file="link4v.stl" name="link4v"/>
|
||||
<mesh file="link5v.stl" name="link5v"/>
|
||||
<mesh file="link6v.stl" name="link6v"/>
|
||||
<mesh file="link7v.stl" name="link7v"/>
|
||||
<mesh file="handv.stl" name="handv"/>
|
||||
<mesh file="fingerv.stl" name="fingerv"/>
|
||||
</asset>
|
||||
<contact>
|
||||
<exclude body1="panda_link0" body2="panda_link1"/>
|
||||
<exclude body1="panda_link1" body2="panda_link2"/>
|
||||
<exclude body1="panda_link2" body2="panda_link3"/>
|
||||
<exclude body1="panda_link3" body2="panda_link4"/>
|
||||
<exclude body1="panda_link4" body2="panda_link5"/>
|
||||
<exclude body1="panda_link5" body2="panda_link6"/>
|
||||
<exclude body1="panda_link6" body2="panda_link7"/>
|
||||
<exclude body1="panda_link7" body2="panda_link8"/>
|
||||
<exclude body1="panda_link8" body2="panda_hand"/>
|
||||
</contact>
|
||||
<visual>
|
||||
<map zfar="1000" znear="0.001"/>
|
||||
</visual>
|
||||
<worldbody>
|
||||
<body name="panda_link0" pos="0 0 0">
|
||||
<inertial diaginertia="0.0126801 0.0117603 0.00856656" mass="3.01399" pos="-0.0291898 -0.000879465 0.0566032" quat="0.00411744 0.564916 0.0132875 0.825031"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link0v" name="panda_link0:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link0v" name="panda_link0:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link1" pos="0 0 0.333">
|
||||
<inertial diaginertia="0.0164224 0.0153969 0.00546286" mass="2.77281" pos="1.1399e-05 -0.0312655 -0.0693733" quat="0.98466 0.174481 -0.000101815 0.000347662"/>
|
||||
<joint axis="0 0 1" damping="300" limited="true" name="panda_joint1" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link1v" name="panda_joint1:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link1v" name="panda_joint1:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link2" pos="0 0 0" quat="0.707107 -0.707107 0 0">
|
||||
<inertial diaginertia="0.016787 0.0157415 0.00553027" mass="2.7996" pos="-1.31766e-05 -0.0703216 0.0311782" quat="0.57484 0.818266 -6.05764e-05 -6.61626e-05"/>
|
||||
<joint axis="0 0 1" damping="300" limited="true" name="panda_joint2" pos="0 0 0" range="-1.8326 1.8326"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link2v" name="panda_joint2:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link2v" name="panda_joint2:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link3" pos="0 -0.316 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00915257 0.00896477 0.00384742" mass="2.14603" pos="0.0443483 0.0249283 -0.03813" quat="0.0615263 0.349824 0.234291 0.904956"/>
|
||||
<joint axis="0 0 1" damping="300" limited="true" name="panda_joint3" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link3v" name="panda_joint3:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link3v" name="panda_joint3:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link4" pos="0.0825 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00946899 0.00928491 0.00396694" mass="2.18807" pos="-0.0385503 0.0395256 0.0247162" quat="0.813566 0.465041 0.309792 0.160858"/>
|
||||
<joint axis="0 0 1" damping="300" limited="true" name="panda_joint4" pos="0 0 0" range="-3.1416 0.0873"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link4v" name="panda_link4:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link4v" name="panda_link4:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link5" pos="-0.0825 0.384 0" quat="0.707107 -0.707107 0 0">
|
||||
<inertial diaginertia="0.0278873 0.0268823 0.00569569" mass="3.19545" pos="-6.36776e-05 0.0384124 -0.10997" quat="0.990767 -0.135571 0.000963106 0.000694406"/>
|
||||
<joint axis="0 0 1" damping="300" limited="true" name="panda_joint5" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link5v" name="panda_link5:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link5v" name="panda_link5:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link6" pos="0 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.00412168 0.0033698 0.00213304" mass="1.35761" pos="0.0510023 0.00693267 0.00616899" quat="-0.0460841 0.754362 0.044494 0.653325"/>
|
||||
<joint axis="0 0 1" damping="300" limited="true" name="panda_joint6" pos="0 0 0" range="-0.0873 3.8223"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link6v" name="panda_link6:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link6v" name="panda_link6:geom2" rgba="1 1 1 1" type="mesh"/>
|
||||
<body name="panda_link7" pos="0.088 0 0" quat="0.707107 0.707107 0 0">
|
||||
<inertial diaginertia="0.000637671 0.000528056 0.000279577" mass="0.417345" pos="0.0103614 0.0103596 0.0791078" quat="0.63547 0.278021 -0.670462 0.263369"/>
|
||||
<joint axis="0 0 1" damping="300" limited="true" name="panda_joint7" pos="0 0 0" range="-2.9671 2.9671"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="link7v" name="panda_link7:geom1" rgba="1 1 1 1" type="mesh"/>
|
||||
<geom mesh="link7v" name="panda_link7:geom2" rgba="1 1 1 1" solimp="1.998 1.999 0" type="mesh"/>
|
||||
<body name="panda_link8" pos="0 0 0.107">
|
||||
<inertial diaginertia="0.1 0.1 0.1" mass="0.1" pos="0 0 0"/>
|
||||
<body name="panda_hand" pos="0 0 0" quat="0.92388 0 0 -0.382683">
|
||||
<inertial diaginertia="0.00227632 0.00206087 0.000456542" mass="0.670782" pos="-2.76618e-06 -0.00061547 0.0239295" quat="0.697945 0.716151 -0.000242485 8.47563e-05"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="handv" name="panda_hand:geom1" type="mesh"/>
|
||||
<geom mesh="handv" name="panda_hand:geom2" solimp="1.998 1.999 0" type="mesh"/>
|
||||
<camera euler="0 3.14 0" fovy="60" ipd="0.0" mode="fixed" name="rgbd" pos="0.1 0.0 0."/>
|
||||
<body name="tcp" pos="0 0 0.105">
|
||||
<site name="tcp" rgba="'0 0 1 0'" size='0.001'/>
|
||||
</body>
|
||||
<body childclass="panda:gripper" name="panda_leftfinger" pos="0 0 0.0584">
|
||||
<inertial diaginertia="5.69661e-06 5.56035e-06 1.55183e-06" mass="0.0218754" pos="-2.42335e-05 0.0119585 0.0237816" quat="0.996177 0.0868631 -2.79377e-05 -0.00926642"/>
|
||||
<!-- <joint axis="0 1 0" limited="true" name="panda_finger_joint1" pos="0 0 0" range="0 0.04"-->
|
||||
<!-- type="slide" />-->
|
||||
<joint axis="0 1 0" name="panda_finger_joint1"/>
|
||||
<site name="panda_leftfinger:site" pos="0 0.012 0.045" rgba="0 0 1 0" size="0.012 0.015 0.012" type="box"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="fingerv" name="panda_leftfinger:geom1" type="mesh"/>
|
||||
<geom mesh="fingerv" name="panda_leftfinger:geom2" type="mesh"/>
|
||||
<body name="finger_joint1_tip" pos="0 0.0085 0.056">
|
||||
<inertial diaginertia="0.01 0.01 0.01" mass="0.01" pos="0 0 0" quat="0 0 0 1"/>
|
||||
<geom conaffinity="1" condim="4" contype="1" friction="2 0.05 0.0001" name="finger1_tip_collision" pos="0 -0.005 -0.012" quat="0 0 0 1" rgba="1 0 0 1" size="0.008 0.004 0.008" solref="0.01 0.5" type="box"/>
|
||||
</body>
|
||||
</body>
|
||||
<body childclass="panda:gripper" name="panda_rightfinger" pos="0 0 0.0584">
|
||||
<inertial diaginertia="5.69661e-06 5.56035e-06 1.55183e-06" mass="0.0218754" pos="2.42335e-05 -0.0119585 0.0237816" quat="0.996177 -0.0868631 2.79377e-05 -0.00926642"/>
|
||||
<joint axis="0 -1 0" name="panda_finger_joint2"/>
|
||||
<site name="panda_rightfinger:site" pos="0 -0.012 0.045" rgba="0 0 1 0" size="0.012 0.015 0.012" type="box"/>
|
||||
<geom conaffinity="0" contype="0" group="1" mesh="fingerv" name="panda_rightfinger:geom1" quat="0 0 0 1" type="mesh"/>
|
||||
<geom condim="4" mesh="fingerv" name="panda_rightfinger:geom2" quat="0 0 0 1" type="mesh"/>
|
||||
<body name="finger_joint2_tip" pos="0 -0.0085 0.056">
|
||||
<inertial diaginertia="0.01 0.01 0.01" mass="0.01" pos="0 0 0" quat="0 0 0 1"/>
|
||||
<geom conaffinity="1" condim="4" contype="1" friction="2 0.05 0.0001" name="finger2_tip_collision" pos="0 0.005 -0.012" quat="0 0 0 1" rgba="1 0 0 1" size="0.008 0.004 0.008" solref="0.01 0.5" type="box"/>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
</body>
|
||||
<camera euler="0 0 0" fovy="45" ipd="0.0" mode="fixed" name="rgbd_cage" pos="0.7 0.1 0.9"/>
|
||||
<body mocap="true" name="panda:mocap" pos="0 0 0">
|
||||
<geom conaffinity="0" contype="0" pos="0 0 0" rgba="0 0.5 0 0.7" size="0.005 0.005 0.005" type="box"/>
|
||||
<!-- <geom conaffinity="0" contype="0" pos="0 0 0" rgba="1 0 0 0.3" size="1 0.005 0.005" type="box" />-->
|
||||
<!-- <geom conaffinity="0" contype="0" pos="0 0 0" rgba="0 1 0 0.3" size="0.005 1 0.005" type="box" />-->
|
||||
<!-- <geom conaffinity="0" contype="0" pos="0 0 0" rgba="0 0 1 0.3" size="0.005 0.005 1" type="box" />-->
|
||||
</body>
|
||||
</worldbody>
|
||||
<equality>
|
||||
<weld body1="panda:mocap" body2="tcp" solref="0.001 1"/>
|
||||
</equality>
|
||||
<sensor>
|
||||
<touch name="touchsensor:left" site="panda_leftfinger:site"/>
|
||||
<touch name="touchsensor:right" site="panda_rightfinger:site"/>
|
||||
</sensor>
|
||||
<default>
|
||||
<default class="panda:gripper">
|
||||
<geom condim="4" friction="1 0.005 0.0001" margin="0.001" solimp="0.998 0.999 0.001" solref="0.02 1" type="box"/>
|
||||
<joint damping="10" limited="true" range="0 0.04" type="slide"/>
|
||||
</default>
|
||||
</default>
|
||||
<actuator>
|
||||
<position ctrllimited="true" ctrlrange="0.001 0.04" forcelimited="true" forcerange="-70 70"
|
||||
joint="panda_finger_joint1" kp="1000000" name="panda_finger_joint1_act"/>
|
||||
<position ctrllimited="true" ctrlrange="0.001 0.04" forcelimited="true" forcerange="-70 70"
|
||||
joint="panda_finger_joint2" kp="1000000" name="panda_finger_joint2_act"/>
|
||||
</actuator>
|
||||
</mujocoinclude>
|
@ -0,0 +1 @@
|
||||
<!--todo-->
|
@ -0,0 +1,19 @@
|
||||
<mujoco model="base_surrounding">
|
||||
<compiler angle="radian" discardvisual="false"/>
|
||||
<option collision="all" cone="elliptic" gravity="0 0 -9.81" impratio="3" solver="Newton" timestep="0.001"
|
||||
tolerance="1e-10"/>
|
||||
<size nconmax="2000" njmax="2000"/>
|
||||
<asset>
|
||||
<texture builtin="gradient" height="32" rgb1="0.26 0.58 0.51" rgb2="0.26 0.58 0.51" type="skybox" width="32"/>
|
||||
</asset>
|
||||
<visual>
|
||||
<map zfar="1000" znear="0.001"/>
|
||||
</visual>
|
||||
<worldbody>
|
||||
<light castshadow="true" cutoff="100" diffuse="1 1 1" dir="-0 0 -1.3" directional="true" exponent="1" pos="0 0 1.3"
|
||||
specular=".1 .1 .1"/>
|
||||
<body name="ground" pos="0 0 -0.94">
|
||||
<geom name="ground:geom1" rgba="0.26 0.58 0.51 1" size="0 0 1" type="plane"/>
|
||||
</body>
|
||||
</worldbody>
|
||||
</mujoco>
|
362
fancy_gym/envs/mujoco/box_pushing/box_pushing_env.py
Normal file
362
fancy_gym/envs/mujoco/box_pushing/box_pushing_env.py
Normal file
@ -0,0 +1,362 @@
|
||||
import os
|
||||
|
||||
import numpy as np
|
||||
from gym import utils, spaces
|
||||
from gym.envs.mujoco import MujocoEnv
|
||||
from fancy_gym.envs.mujoco.box_pushing.box_pushing_utils import rot_to_quat, get_quaternion_error, rotation_distance
|
||||
from fancy_gym.envs.mujoco.box_pushing.box_pushing_utils import q_max, q_min, q_dot_max, q_torque_max
|
||||
from fancy_gym.envs.mujoco.box_pushing.box_pushing_utils import desired_rod_quat
|
||||
|
||||
import mujoco
|
||||
|
||||
MAX_EPISODE_STEPS_BOX_PUSHING = 100
|
||||
|
||||
BOX_POS_BOUND = np.array([[0.3, -0.45, -0.01], [0.6, 0.45, -0.01]])
|
||||
|
||||
class BoxPushingEnvBase(MujocoEnv, utils.EzPickle):
|
||||
"""
|
||||
franka box pushing environment
|
||||
action space:
|
||||
normalized joints torque * 7 , range [-1, 1]
|
||||
observation space:
|
||||
|
||||
rewards:
|
||||
1. dense reward
|
||||
2. time-depend sparse reward
|
||||
3. time-spatial-depend sparse reward
|
||||
"""
|
||||
|
||||
def __init__(self, frame_skip: int = 10):
|
||||
utils.EzPickle.__init__(**locals())
|
||||
self._steps = 0
|
||||
self.init_qpos_box_pushing = np.array([0., 0., 0., -1.5, 0., 1.5, 0., 0., 0., 0.6, 0.45, 0.0, 1., 0., 0., 0.])
|
||||
self.init_qvel_box_pushing = np.zeros(15)
|
||||
self.frame_skip = frame_skip
|
||||
|
||||
self._q_max = q_max
|
||||
self._q_min = q_min
|
||||
self._q_dot_max = q_dot_max
|
||||
self._desired_rod_quat = desired_rod_quat
|
||||
|
||||
self._episode_energy = 0.
|
||||
MujocoEnv.__init__(self,
|
||||
model_path=os.path.join(os.path.dirname(__file__), "assets", "box_pushing.xml"),
|
||||
frame_skip=self.frame_skip,
|
||||
mujoco_bindings="mujoco")
|
||||
self.action_space = spaces.Box(low=-1, high=1, shape=(7,))
|
||||
|
||||
def step(self, action):
|
||||
action = 10 * np.clip(action, self.action_space.low, self.action_space.high)
|
||||
resultant_action = np.clip(action + self.data.qfrc_bias[:7].copy(), -q_torque_max, q_torque_max)
|
||||
|
||||
unstable_simulation = False
|
||||
|
||||
try:
|
||||
self.do_simulation(resultant_action, self.frame_skip)
|
||||
except Exception as e:
|
||||
print(e)
|
||||
unstable_simulation = True
|
||||
|
||||
self._steps += 1
|
||||
self._episode_energy += np.sum(np.square(action))
|
||||
|
||||
episode_end = True if self._steps >= MAX_EPISODE_STEPS_BOX_PUSHING else False
|
||||
|
||||
box_pos = self.data.body("box_0").xpos.copy()
|
||||
box_quat = self.data.body("box_0").xquat.copy()
|
||||
target_pos = self.data.body("replan_target_pos").xpos.copy()
|
||||
target_quat = self.data.body("replan_target_pos").xquat.copy()
|
||||
rod_tip_pos = self.data.site("rod_tip").xpos.copy()
|
||||
rod_quat = self.data.body("push_rod").xquat.copy()
|
||||
qpos = self.data.qpos[:7].copy()
|
||||
qvel = self.data.qvel[:7].copy()
|
||||
|
||||
if not unstable_simulation:
|
||||
reward = self._get_reward(episode_end, box_pos, box_quat, target_pos, target_quat,
|
||||
rod_tip_pos, rod_quat, qpos, qvel, action)
|
||||
else:
|
||||
reward = -50
|
||||
|
||||
obs = self._get_obs()
|
||||
box_goal_pos_dist = 0. if not episode_end else np.linalg.norm(box_pos - target_pos)
|
||||
box_goal_quat_dist = 0. if not episode_end else rotation_distance(box_quat, target_quat)
|
||||
infos = {
|
||||
'episode_end': episode_end,
|
||||
'box_goal_pos_dist': box_goal_pos_dist,
|
||||
'box_goal_rot_dist': box_goal_quat_dist,
|
||||
'episode_energy': 0. if not episode_end else self._episode_energy,
|
||||
'is_success': True if episode_end and box_goal_pos_dist < 0.05 and box_goal_quat_dist < 0.5 else False,
|
||||
'num_steps': self._steps
|
||||
}
|
||||
return obs, reward, episode_end, infos
|
||||
|
||||
def reset_model(self):
|
||||
# rest box to initial position
|
||||
self.set_state(self.init_qpos_box_pushing, self.init_qvel_box_pushing)
|
||||
box_init_pos = np.array([0.4, 0.3, -0.01, 0.0, 0.0, 0.0, 1.0])
|
||||
self.data.joint("box_joint").qpos = box_init_pos
|
||||
|
||||
# set target position
|
||||
box_target_pos = self.sample_context()
|
||||
while np.linalg.norm(box_target_pos[:2] - box_init_pos[:2]) < 0.3:
|
||||
box_target_pos = self.sample_context()
|
||||
# box_target_pos[0] = 0.4
|
||||
# box_target_pos[1] = -0.3
|
||||
# box_target_pos[-4:] = np.array([0.0, 0.0, 0.0, 1.0])
|
||||
self.model.body_pos[2] = box_target_pos[:3]
|
||||
self.model.body_quat[2] = box_target_pos[-4:]
|
||||
self.model.body_pos[3] = box_target_pos[:3]
|
||||
self.model.body_quat[3] = box_target_pos[-4:]
|
||||
|
||||
# set the robot to the right configuration (rod tip in the box)
|
||||
desired_tcp_pos = box_init_pos[:3] + np.array([0.0, 0.0, 0.15])
|
||||
desired_tcp_quat = np.array([0, 1, 0, 0])
|
||||
desired_joint_pos = self.calculateOfflineIK(desired_tcp_pos, desired_tcp_quat)
|
||||
self.data.qpos[:7] = desired_joint_pos
|
||||
|
||||
mujoco.mj_forward(self.model, self.data)
|
||||
self._steps = 0
|
||||
self._episode_energy = 0.
|
||||
|
||||
return self._get_obs()
|
||||
|
||||
def sample_context(self):
|
||||
pos = self.np_random.uniform(low=BOX_POS_BOUND[0], high=BOX_POS_BOUND[1])
|
||||
theta = self.np_random.uniform(low=0, high=np.pi * 2)
|
||||
quat = rot_to_quat(theta, np.array([0, 0, 1]))
|
||||
return np.concatenate([pos, quat])
|
||||
|
||||
def _get_reward(self, episode_end, box_pos, box_quat, target_pos, target_quat,
|
||||
rod_tip_pos, rod_quat, qpos, qvel, action):
|
||||
raise NotImplementedError
|
||||
|
||||
def _get_obs(self):
|
||||
obs = np.concatenate([
|
||||
self.data.qpos[:7].copy(), # joint position
|
||||
self.data.qvel[:7].copy(), # joint velocity
|
||||
# self.data.qfrc_bias[:7].copy(), # joint gravity compensation
|
||||
# self.data.site("rod_tip").xpos.copy(), # position of rod tip
|
||||
# self.data.body("push_rod").xquat.copy(), # orientation of rod
|
||||
self.data.body("box_0").xpos.copy(), # position of box
|
||||
self.data.body("box_0").xquat.copy(), # orientation of box
|
||||
self.data.body("replan_target_pos").xpos.copy(), # position of target
|
||||
self.data.body("replan_target_pos").xquat.copy() # orientation of target
|
||||
])
|
||||
return obs
|
||||
|
||||
def _joint_limit_violate_penalty(self, qpos, qvel, enable_pos_limit=False, enable_vel_limit=False):
|
||||
penalty = 0.
|
||||
p_coeff = 1.
|
||||
v_coeff = 1.
|
||||
# q_limit
|
||||
if enable_pos_limit:
|
||||
higher_error = qpos - self._q_max
|
||||
lower_error = self._q_min - qpos
|
||||
penalty -= p_coeff * (abs(np.sum(higher_error[qpos > self._q_max])) +
|
||||
abs(np.sum(lower_error[qpos < self._q_min])))
|
||||
# q_dot_limit
|
||||
if enable_vel_limit:
|
||||
q_dot_error = abs(qvel) - abs(self._q_dot_max)
|
||||
penalty -= v_coeff * abs(np.sum(q_dot_error[q_dot_error > 0.]))
|
||||
return penalty
|
||||
|
||||
def get_body_jacp(self, name):
|
||||
id = mujoco.mj_name2id(self.model, 1, name)
|
||||
jacp = np.zeros((3, self.model.nv))
|
||||
mujoco.mj_jacBody(self.model, self.data, jacp, None, id)
|
||||
return jacp
|
||||
|
||||
def get_body_jacr(self, name):
|
||||
id = mujoco.mj_name2id(self.model, 1, name)
|
||||
jacr = np.zeros((3, self.model.nv))
|
||||
mujoco.mj_jacBody(self.model, self.data, None, jacr, id)
|
||||
return jacr
|
||||
|
||||
def calculateOfflineIK(self, desired_cart_pos, desired_cart_quat):
|
||||
"""
|
||||
calculate offline inverse kinematics for franka pandas
|
||||
:param desired_cart_pos: desired cartesian position of tool center point
|
||||
:param desired_cart_quat: desired cartesian quaternion of tool center point
|
||||
:return: joint angles
|
||||
"""
|
||||
J_reg = 1e-6
|
||||
w = np.diag([1, 1, 1, 1, 1, 1, 1])
|
||||
target_theta_null = np.array([
|
||||
3.57795216e-09,
|
||||
1.74532920e-01,
|
||||
3.30500960e-08,
|
||||
-8.72664630e-01,
|
||||
-1.14096181e-07,
|
||||
1.22173047e00,
|
||||
7.85398126e-01])
|
||||
eps = 1e-5 # threshold for convergence
|
||||
IT_MAX = 1000
|
||||
dt = 1e-3
|
||||
i = 0
|
||||
pgain = [
|
||||
33.9403713446798,
|
||||
30.9403713446798,
|
||||
33.9403713446798,
|
||||
27.69370238555632,
|
||||
33.98706171459314,
|
||||
30.9185531893281,
|
||||
]
|
||||
pgain_null = 5 * np.array([
|
||||
7.675519770796831,
|
||||
2.676935478437176,
|
||||
8.539040163444975,
|
||||
1.270446361314313,
|
||||
8.87752182480855,
|
||||
2.186782233762969,
|
||||
4.414432577659688,
|
||||
])
|
||||
pgain_limit = 20
|
||||
q = self.data.qpos[:7].copy()
|
||||
qd_d = np.zeros(q.shape)
|
||||
old_err_norm = np.inf
|
||||
|
||||
while True:
|
||||
q_old = q
|
||||
q = q + dt * qd_d
|
||||
q = np.clip(q, q_min, q_max)
|
||||
self.data.qpos[:7] = q
|
||||
mujoco.mj_forward(self.model, self.data)
|
||||
current_cart_pos = self.data.body("tcp").xpos.copy()
|
||||
current_cart_quat = self.data.body("tcp").xquat.copy()
|
||||
|
||||
cart_pos_error = np.clip(desired_cart_pos - current_cart_pos, -0.1, 0.1)
|
||||
|
||||
if np.linalg.norm(current_cart_quat - desired_cart_quat) > np.linalg.norm(current_cart_quat + desired_cart_quat):
|
||||
current_cart_quat = -current_cart_quat
|
||||
cart_quat_error = np.clip(get_quaternion_error(current_cart_quat, desired_cart_quat), -0.5, 0.5)
|
||||
|
||||
err = np.hstack((cart_pos_error, cart_quat_error))
|
||||
err_norm = np.sum(cart_pos_error**2) + np.sum((current_cart_quat - desired_cart_quat)**2)
|
||||
if err_norm > old_err_norm:
|
||||
q = q_old
|
||||
dt = 0.7 * dt
|
||||
continue
|
||||
else:
|
||||
dt = 1.025 * dt
|
||||
|
||||
if err_norm < eps:
|
||||
break
|
||||
if i > IT_MAX:
|
||||
break
|
||||
|
||||
old_err_norm = err_norm
|
||||
|
||||
### get Jacobian by mujoco
|
||||
self.data.qpos[:7] = q
|
||||
mujoco.mj_forward(self.model, self.data)
|
||||
|
||||
jacp = self.get_body_jacp("tcp")[:, :7].copy()
|
||||
jacr = self.get_body_jacr("tcp")[:, :7].copy()
|
||||
|
||||
J = np.concatenate((jacp, jacr), axis=0)
|
||||
|
||||
Jw = J.dot(w)
|
||||
|
||||
# J * W * J.T + J_reg * I
|
||||
JwJ_reg = Jw.dot(J.T) + J_reg * np.eye(J.shape[0])
|
||||
|
||||
# Null space velocity, points to home position
|
||||
qd_null = pgain_null * (target_theta_null - q)
|
||||
|
||||
margin_to_limit = 0.1
|
||||
qd_null_limit = np.zeros(qd_null.shape)
|
||||
qd_null_limit_max = pgain_limit * (q_max - margin_to_limit - q)
|
||||
qd_null_limit_min = pgain_limit * (q_min + margin_to_limit - q)
|
||||
qd_null_limit[q > q_max - margin_to_limit] += qd_null_limit_max[q > q_max - margin_to_limit]
|
||||
qd_null_limit[q < q_min + margin_to_limit] += qd_null_limit_min[q < q_min + margin_to_limit]
|
||||
qd_null += qd_null_limit
|
||||
|
||||
# W J.T (J W J' + reg I)^-1 xd_d + (I - W J.T (J W J' + reg I)^-1 J qd_null
|
||||
qd_d = np.linalg.solve(JwJ_reg, pgain * err - J.dot(qd_null))
|
||||
|
||||
qd_d = w.dot(J.transpose()).dot(qd_d) + qd_null
|
||||
|
||||
i += 1
|
||||
|
||||
return q
|
||||
|
||||
class BoxPushingDense(BoxPushingEnvBase):
|
||||
def __init__(self, frame_skip: int = 10):
|
||||
super(BoxPushingDense, self).__init__(frame_skip=frame_skip)
|
||||
def _get_reward(self, episode_end, box_pos, box_quat, target_pos, target_quat,
|
||||
rod_tip_pos, rod_quat, qpos, qvel, action):
|
||||
joint_penalty = self._joint_limit_violate_penalty(qpos,
|
||||
qvel,
|
||||
enable_pos_limit=True,
|
||||
enable_vel_limit=True)
|
||||
tcp_box_dist_reward = -2 * np.clip(np.linalg.norm(box_pos - rod_tip_pos), 0.05, 100)
|
||||
box_goal_pos_dist_reward = -3.5 * np.linalg.norm(box_pos - target_pos)
|
||||
box_goal_rot_dist_reward = -rotation_distance(box_quat, target_quat) / np.pi
|
||||
energy_cost = -0.0005 * np.sum(np.square(action))
|
||||
|
||||
reward = joint_penalty + tcp_box_dist_reward + \
|
||||
box_goal_pos_dist_reward + box_goal_rot_dist_reward + energy_cost
|
||||
|
||||
rod_inclined_angle = rotation_distance(rod_quat, self._desired_rod_quat)
|
||||
if rod_inclined_angle > np.pi / 4:
|
||||
reward -= rod_inclined_angle / (np.pi)
|
||||
|
||||
return reward
|
||||
|
||||
class BoxPushingTemporalSparse(BoxPushingEnvBase):
|
||||
def __init__(self, frame_skip: int = 10):
|
||||
super(BoxPushingTemporalSparse, self).__init__(frame_skip=frame_skip)
|
||||
|
||||
def _get_reward(self, episode_end, box_pos, box_quat, target_pos, target_quat,
|
||||
rod_tip_pos, rod_quat, qpos, qvel, action):
|
||||
reward = 0.
|
||||
joint_penalty = self._joint_limit_violate_penalty(qpos, qvel, enable_pos_limit=True, enable_vel_limit=True)
|
||||
energy_cost = -0.0005 * np.sum(np.square(action))
|
||||
tcp_box_dist_reward = -2 * np.clip(np.linalg.norm(box_pos - rod_tip_pos), 0.05, 100)
|
||||
reward += joint_penalty + tcp_box_dist_reward + energy_cost
|
||||
rod_inclined_angle = rotation_distance(rod_quat, desired_rod_quat)
|
||||
|
||||
if rod_inclined_angle > np.pi / 4:
|
||||
reward -= rod_inclined_angle / (np.pi)
|
||||
|
||||
if not episode_end:
|
||||
return reward
|
||||
|
||||
box_goal_dist = np.linalg.norm(box_pos - target_pos)
|
||||
|
||||
box_goal_pos_dist_reward = -3.5 * box_goal_dist * 100
|
||||
box_goal_rot_dist_reward = -rotation_distance(box_quat, target_quat) / np.pi * 100
|
||||
|
||||
reward += box_goal_pos_dist_reward + box_goal_rot_dist_reward
|
||||
|
||||
return reward
|
||||
|
||||
class BoxPushingTemporalSpatialSparse(BoxPushingEnvBase):
|
||||
|
||||
def __init__(self, frame_skip: int = 10):
|
||||
super(BoxPushingTemporalSpatialSparse, self).__init__(frame_skip=frame_skip)
|
||||
|
||||
def _get_reward(self, episode_end, box_pos, box_quat, target_pos, target_quat,
|
||||
rod_tip_pos, rod_quat, qpos, qvel, action):
|
||||
reward = 0.
|
||||
joint_penalty = self._joint_limit_violate_penalty(qpos, qvel, enable_pos_limit=True, enable_vel_limit=True)
|
||||
energy_cost = -0.0005 * np.sum(np.square(action))
|
||||
tcp_box_dist_reward = -2 * np.clip(np.linalg.norm(box_pos - rod_tip_pos), 0.05, 100)
|
||||
reward += joint_penalty + tcp_box_dist_reward + energy_cost
|
||||
rod_inclined_angle = rotation_distance(rod_quat, desired_rod_quat)
|
||||
|
||||
if rod_inclined_angle > np.pi / 4:
|
||||
reward -= rod_inclined_angle / (np.pi)
|
||||
|
||||
if not episode_end:
|
||||
return reward
|
||||
|
||||
box_goal_dist = np.linalg.norm(box_pos - target_pos)
|
||||
|
||||
if box_goal_dist < 0.1:
|
||||
reward += 300
|
||||
box_goal_pos_dist_reward = np.clip(- 3.5 * box_goal_dist * 100 * 3, -100, 0)
|
||||
box_goal_rot_dist_reward = np.clip(- rotation_distance(box_quat, target_quat)/np.pi * 100 * 1.5, -100, 0)
|
||||
reward += box_goal_pos_dist_reward + box_goal_rot_dist_reward
|
||||
|
||||
return reward
|
53
fancy_gym/envs/mujoco/box_pushing/box_pushing_utils.py
Normal file
53
fancy_gym/envs/mujoco/box_pushing/box_pushing_utils.py
Normal file
@ -0,0 +1,53 @@
|
||||
import numpy as np
|
||||
|
||||
|
||||
# joint constraints for Franka robot
|
||||
q_max = np.array([2.8973, 1.7628, 2.8973, -0.0698, 2.8973, 3.7525, 2.8973])
|
||||
q_min = np.array([-2.8973, -1.7628, -2.8973, -3.0718, -2.8973, -0.0175, -2.8973])
|
||||
|
||||
q_dot_max = np.array([2.1750, 2.1750, 2.1750, 2.1750, 2.6100, 2.6100, 2.6100])
|
||||
q_torque_max = np.array([90., 90., 90., 90., 12., 12., 12.])
|
||||
#
|
||||
desired_rod_quat = np.array([0.0, 1.0, 0.0, 0.0])
|
||||
|
||||
def skew(x):
|
||||
"""
|
||||
Returns the skew-symmetric matrix of x
|
||||
param x: 3x1 vector
|
||||
"""
|
||||
return np.array([[0, -x[2], x[1]], [x[2], 0, -x[0]], [-x[1], x[0], 0]])
|
||||
|
||||
def get_quaternion_error(curr_quat, des_quat):
|
||||
"""
|
||||
Calculates the difference between the current quaternion and the desired quaternion.
|
||||
See Siciliano textbook page 140 Eq 3.91
|
||||
|
||||
param curr_quat: current quaternion
|
||||
param des_quat: desired quaternion
|
||||
return: difference between current quaternion and desired quaternion
|
||||
"""
|
||||
return curr_quat[0] * des_quat[1:] - des_quat[0] * curr_quat[1:] - skew(des_quat[1:]) @ curr_quat[1:]
|
||||
|
||||
def rotation_distance(p: np.array, q: np.array):
|
||||
"""
|
||||
Calculates the rotation angular between two quaternions
|
||||
param p: quaternion
|
||||
param q: quaternion
|
||||
theta: rotation angle between p and q (rad)
|
||||
"""
|
||||
assert p.shape == q.shape, "p and q should be quaternion"
|
||||
theta = 2 * np.arccos(abs(p @ q))
|
||||
return theta
|
||||
|
||||
|
||||
def rot_to_quat(theta, axis):
|
||||
"""
|
||||
Converts rotation angle along an axis to quaternion
|
||||
param theta: rotation angle (rad)
|
||||
param axis: rotation axis
|
||||
return: quaternion
|
||||
"""
|
||||
quant = np.zeros(4)
|
||||
quant[0] = np.sin(theta / 2.)
|
||||
quant[1:] = np.cos(theta / 2.) * axis
|
||||
return quant
|
29
fancy_gym/envs/mujoco/box_pushing/mp_wrapper.py
Normal file
29
fancy_gym/envs/mujoco/box_pushing/mp_wrapper.py
Normal file
@ -0,0 +1,29 @@
|
||||
from typing import Union, Tuple
|
||||
|
||||
import numpy as np
|
||||
|
||||
from fancy_gym.black_box.raw_interface_wrapper import RawInterfaceWrapper
|
||||
|
||||
|
||||
class MPWrapper(RawInterfaceWrapper):
|
||||
|
||||
# Random x goal + random init pos
|
||||
@property
|
||||
def context_mask(self):
|
||||
return np.hstack([
|
||||
[False] * 7, # joints position
|
||||
[False] * 7, # joints velocity
|
||||
[False] * 3, # position of box
|
||||
[False] * 4, # orientation of box
|
||||
[True] * 3, # position of target
|
||||
[True] * 4, # orientation of target
|
||||
# [True] * 1, # time
|
||||
])
|
||||
|
||||
@property
|
||||
def current_pos(self) -> Union[float, int, np.ndarray, Tuple]:
|
||||
return self.data.qpos[:7].copy()
|
||||
|
||||
@property
|
||||
def current_vel(self) -> Union[float, int, np.ndarray, Tuple]:
|
||||
return self.data.qvel[:7].copy()
|
62
fancy_gym/examples/example_replanning_envs.py
Normal file
62
fancy_gym/examples/example_replanning_envs.py
Normal file
@ -0,0 +1,62 @@
|
||||
import fancy_gym
|
||||
|
||||
def example_run_replanning_env(env_name="BoxPushingDenseReplanProDMP-v0", seed=1, iterations=1, render=False):
|
||||
env = fancy_gym.make(env_name, seed=seed)
|
||||
env.reset()
|
||||
for i in range(iterations):
|
||||
done = False
|
||||
while done is False:
|
||||
ac = env.action_space.sample()
|
||||
obs, reward, done, info = env.step(ac)
|
||||
if render:
|
||||
env.render(mode="human")
|
||||
if done:
|
||||
env.reset()
|
||||
env.close()
|
||||
del env
|
||||
|
||||
def example_custom_replanning_envs(seed=0, iteration=100, render=True):
|
||||
# id for a step-based environment
|
||||
base_env_id = "BoxPushingDense-v0"
|
||||
|
||||
wrappers = [fancy_gym.envs.mujoco.box_pushing.mp_wrapper.MPWrapper]
|
||||
|
||||
trajectory_generator_kwargs = {'trajectory_generator_type': 'prodmp',
|
||||
'weight_scale': 1}
|
||||
phase_generator_kwargs = {'phase_generator_type': 'exp'}
|
||||
controller_kwargs = {'controller_type': 'velocity'}
|
||||
basis_generator_kwargs = {'basis_generator_type': 'prodmp',
|
||||
'num_basis': 5}
|
||||
|
||||
# max_planning_times: the maximum number of plans can be generated
|
||||
# replanning_schedule: the trigger for replanning
|
||||
# condition_on_desired: use desired state as the boundary condition for the next plan
|
||||
black_box_kwargs = {'max_planning_times': 4,
|
||||
'replanning_schedule': lambda pos, vel, obs, action, t: t % 25 == 0,
|
||||
'condition_on_desired': True}
|
||||
|
||||
env = fancy_gym.make_bb(env_id=base_env_id, wrappers=wrappers, black_box_kwargs=black_box_kwargs,
|
||||
traj_gen_kwargs=trajectory_generator_kwargs, controller_kwargs=controller_kwargs,
|
||||
phase_kwargs=phase_generator_kwargs, basis_kwargs=basis_generator_kwargs,
|
||||
seed=seed)
|
||||
if render:
|
||||
env.render(mode="human")
|
||||
|
||||
obs = env.reset()
|
||||
|
||||
for i in range(iteration):
|
||||
ac = env.action_space.sample()
|
||||
obs, reward, done, info = env.step(ac)
|
||||
if done:
|
||||
env.reset()
|
||||
|
||||
env.close()
|
||||
del env
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
# run a registered replanning environment
|
||||
example_run_replanning_env(env_name="BoxPushingDenseReplanProDMP-v0", seed=1, iterations=1, render=False)
|
||||
|
||||
# run a custom replanning environment
|
||||
example_custom_replanning_envs(seed=0, iteration=8, render=True)
|
@ -24,7 +24,7 @@ def example_mp(env_name="HoleReacherProMP-v0", seed=1, iterations=1, render=True
|
||||
# number of samples/full trajectories (multiple environment steps)
|
||||
for i in range(iterations):
|
||||
|
||||
if render and i % 2 == 0:
|
||||
if render and i % 1 == 0:
|
||||
# This renders the full MP trajectory
|
||||
# It is only required to call render() once in the beginning, which renders every consecutive trajectory.
|
||||
# Resetting to no rendering, can be achieved by render(mode=None).
|
||||
@ -33,7 +33,7 @@ def example_mp(env_name="HoleReacherProMP-v0", seed=1, iterations=1, render=True
|
||||
# Just make sure the correct mode is set before executing the step.
|
||||
env.render(mode="human")
|
||||
else:
|
||||
env.render(mode=None)
|
||||
env.render()
|
||||
|
||||
# Now the action space is not the raw action but the parametrization of the trajectory generator,
|
||||
# such as a ProMP
|
||||
@ -161,6 +161,10 @@ if __name__ == '__main__':
|
||||
|
||||
# ProMP
|
||||
example_mp("HoleReacherProMP-v0", seed=10, iterations=5, render=render)
|
||||
example_mp("BoxPushingTemporalSparseProMP-v0", seed=10, iterations=1, render=render)
|
||||
|
||||
# ProDMP
|
||||
example_mp("BoxPushingDenseReplanProDMP-v0", seed=10, iterations=4, render=render)
|
||||
|
||||
# Altered basis functions
|
||||
obs1 = example_custom_mp("Reacher5dProMP-v0", seed=10, iterations=1, render=render)
|
||||
|
@ -22,7 +22,7 @@ def example_mp(env_name, seed=1, render=True):
|
||||
if render and i % 2 == 0:
|
||||
env.render(mode="human")
|
||||
else:
|
||||
env.render(mode=None)
|
||||
env.render()
|
||||
ac = env.action_space.sample()
|
||||
obs, reward, done, info = env.step(ac)
|
||||
returns += reward
|
||||
|
8
setup.py
8
setup.py
@ -18,9 +18,9 @@ extras["all"] = list(set(itertools.chain.from_iterable(map(lambda group: extras[
|
||||
setup(
|
||||
author='Fabian Otto, Onur Celik',
|
||||
name='fancy_gym',
|
||||
version='0.3',
|
||||
version='0.2',
|
||||
classifiers=[
|
||||
'Development Status :: 4 - Beta',
|
||||
'Development Status :: 3 - Alpha',
|
||||
'Intended Audience :: Science/Research',
|
||||
'License :: OSI Approved :: MIT License',
|
||||
'Natural Language :: English',
|
||||
@ -34,8 +34,8 @@ setup(
|
||||
],
|
||||
extras_require=extras,
|
||||
install_requires=[
|
||||
'gym[mujoco]<0.25.0,>=0.24.0',
|
||||
'mp_pytorch @ git+https://github.com/ALRhub/MP_PyTorch.git@main'
|
||||
'gym[mujoco]<0.25.0,>=0.24.1',
|
||||
'mp_pytorch<=0.1.3'
|
||||
],
|
||||
packages=[package for package in find_packages() if package.startswith("fancy_gym")],
|
||||
package_data={
|
||||
|
@ -67,28 +67,32 @@ def test_missing_wrapper(env_id: str):
|
||||
fancy_gym.make_bb(env_id, [], {}, {}, {}, {}, {})
|
||||
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp'])
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp', 'prodmp'])
|
||||
def test_missing_local_state(mp_type: str):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
|
||||
env = fancy_gym.make_bb('toy-v0', [RawInterfaceWrapper], {},
|
||||
{'trajectory_generator_type': mp_type},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': 'exp'},
|
||||
{'basis_generator_type': 'rbf'})
|
||||
{'basis_generator_type': basis_generator_type})
|
||||
env.reset()
|
||||
with pytest.raises(NotImplementedError):
|
||||
env.step(env.action_space.sample())
|
||||
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp'])
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp', 'prodmp'])
|
||||
@pytest.mark.parametrize('env_wrap', zip(ENV_IDS, WRAPPERS))
|
||||
@pytest.mark.parametrize('verbose', [1, 2])
|
||||
def test_verbosity(mp_type: str, env_wrap: Tuple[str, Type[RawInterfaceWrapper]], verbose: int):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
|
||||
env_id, wrapper_class = env_wrap
|
||||
env = fancy_gym.make_bb(env_id, [wrapper_class], {'verbose': verbose},
|
||||
{'trajectory_generator_type': mp_type},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': 'exp'},
|
||||
{'basis_generator_type': 'rbf'})
|
||||
{'basis_generator_type': basis_generator_type})
|
||||
env.reset()
|
||||
info_keys = list(env.step(env.action_space.sample())[3].keys())
|
||||
|
||||
@ -104,15 +108,17 @@ def test_verbosity(mp_type: str, env_wrap: Tuple[str, Type[RawInterfaceWrapper]]
|
||||
assert all(e in info_keys for e in mp_keys)
|
||||
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp'])
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp', 'prodmp'])
|
||||
@pytest.mark.parametrize('env_wrap', zip(ENV_IDS, WRAPPERS))
|
||||
def test_length(mp_type: str, env_wrap: Tuple[str, Type[RawInterfaceWrapper]]):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
|
||||
env_id, wrapper_class = env_wrap
|
||||
env = fancy_gym.make_bb(env_id, [wrapper_class], {},
|
||||
{'trajectory_generator_type': mp_type},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': 'exp'},
|
||||
{'basis_generator_type': 'rbf'})
|
||||
{'basis_generator_type': basis_generator_type})
|
||||
|
||||
for _ in range(5):
|
||||
env.reset()
|
||||
@ -121,14 +127,15 @@ def test_length(mp_type: str, env_wrap: Tuple[str, Type[RawInterfaceWrapper]]):
|
||||
assert length == env.spec.max_episode_steps
|
||||
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp'])
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp', 'prodmp'])
|
||||
@pytest.mark.parametrize('reward_aggregation', [np.sum, np.mean, np.median, lambda x: np.mean(x[::2])])
|
||||
def test_aggregation(mp_type: str, reward_aggregation: Callable[[np.ndarray], float]):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
env = fancy_gym.make_bb('toy-v0', [ToyWrapper], {'reward_aggregation': reward_aggregation},
|
||||
{'trajectory_generator_type': mp_type},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': 'exp'},
|
||||
{'basis_generator_type': 'rbf'})
|
||||
{'basis_generator_type': basis_generator_type})
|
||||
env.reset()
|
||||
# ToyEnv only returns 1 as reward
|
||||
assert env.step(env.action_space.sample())[1] == reward_aggregation(np.ones(50, ))
|
||||
@ -149,12 +156,13 @@ def test_context_space(mp_type: str, env_wrap: Tuple[str, Type[RawInterfaceWrapp
|
||||
assert env.observation_space.shape == wrapper.context_mask[wrapper.context_mask].shape
|
||||
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp'])
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp', 'prodmp'])
|
||||
@pytest.mark.parametrize('num_dof', [0, 1, 2, 5])
|
||||
@pytest.mark.parametrize('num_basis', [0, 1, 2, 5])
|
||||
@pytest.mark.parametrize('learn_tau', [True, False])
|
||||
@pytest.mark.parametrize('learn_delay', [True, False])
|
||||
def test_action_space(mp_type: str, num_dof: int, num_basis: int, learn_tau: bool, learn_delay: bool):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
env = fancy_gym.make_bb('toy-v0', [ToyWrapper], {},
|
||||
{'trajectory_generator_type': mp_type,
|
||||
'action_dim': num_dof
|
||||
@ -164,28 +172,29 @@ def test_action_space(mp_type: str, num_dof: int, num_basis: int, learn_tau: boo
|
||||
'learn_tau': learn_tau,
|
||||
'learn_delay': learn_delay
|
||||
},
|
||||
{'basis_generator_type': 'rbf',
|
||||
{'basis_generator_type': basis_generator_type,
|
||||
'num_basis': num_basis
|
||||
})
|
||||
|
||||
base_dims = num_dof * num_basis
|
||||
additional_dims = num_dof if mp_type == 'dmp' else 0
|
||||
additional_dims = num_dof if 'dmp' in mp_type else 0
|
||||
traj_modification_dims = int(learn_tau) + int(learn_delay)
|
||||
assert env.action_space.shape[0] == base_dims + traj_modification_dims + additional_dims
|
||||
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp'])
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp', 'prodmp'])
|
||||
@pytest.mark.parametrize('a', [1])
|
||||
@pytest.mark.parametrize('b', [1.0])
|
||||
@pytest.mark.parametrize('c', [[1], [1.0], ['str'], [{'a': 'b'}], [np.ones(3, )]])
|
||||
@pytest.mark.parametrize('d', [{'a': 1}, {1: 2.0}, {'a': [1.0]}, {'a': np.ones(3, )}, {'a': {'a': 'b'}}])
|
||||
@pytest.mark.parametrize('e', [Object()])
|
||||
def test_change_env_kwargs(mp_type: str, a: int, b: float, c: list, d: dict, e: Object):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
env = fancy_gym.make_bb('toy-v0', [ToyWrapper], {},
|
||||
{'trajectory_generator_type': mp_type},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': 'exp'},
|
||||
{'basis_generator_type': 'rbf'},
|
||||
{'basis_generator_type': basis_generator_type},
|
||||
a=a, b=b, c=c, d=d, e=e
|
||||
)
|
||||
assert a is env.a
|
||||
@ -196,18 +205,20 @@ def test_change_env_kwargs(mp_type: str, a: int, b: float, c: list, d: dict, e:
|
||||
assert e is env.e
|
||||
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp'])
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'prodmp'])
|
||||
@pytest.mark.parametrize('tau', [0.25, 0.5, 0.75, 1])
|
||||
def test_learn_tau(mp_type: str, tau: float):
|
||||
phase_generator_type = 'exp' if mp_type == 'prodmp' else 'linear'
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
env = fancy_gym.make_bb('toy-v0', [ToyWrapper], {'verbose': 2},
|
||||
{'trajectory_generator_type': mp_type,
|
||||
},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': 'linear',
|
||||
{'phase_generator_type': phase_generator_type,
|
||||
'learn_tau': True,
|
||||
'learn_delay': False
|
||||
},
|
||||
{'basis_generator_type': 'rbf',
|
||||
{'basis_generator_type': basis_generator_type,
|
||||
}, seed=SEED)
|
||||
|
||||
d = True
|
||||
@ -228,26 +239,29 @@ def test_learn_tau(mp_type: str, tau: float):
|
||||
vel = info['velocities'].flatten()
|
||||
|
||||
# Check end is all same (only true for linear basis)
|
||||
assert np.all(pos[tau_time_steps:] == pos[-1])
|
||||
assert np.all(vel[tau_time_steps:] == vel[-1])
|
||||
if phase_generator_type == "linear":
|
||||
assert np.all(pos[tau_time_steps:] == pos[-1])
|
||||
assert np.all(vel[tau_time_steps:] == vel[-1])
|
||||
|
||||
# Check active trajectory section is different to end values
|
||||
assert np.all(pos[:tau_time_steps - 1] != pos[-1])
|
||||
assert np.all(vel[:tau_time_steps - 2] != vel[-1])
|
||||
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp'])
|
||||
#
|
||||
#
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'prodmp'])
|
||||
@pytest.mark.parametrize('delay', [0, 0.25, 0.5, 0.75])
|
||||
def test_learn_delay(mp_type: str, delay: float):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
phase_generator_type = 'exp' if mp_type == 'prodmp' else 'linear'
|
||||
env = fancy_gym.make_bb('toy-v0', [ToyWrapper], {'verbose': 2},
|
||||
{'trajectory_generator_type': mp_type,
|
||||
},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': 'linear',
|
||||
{'phase_generator_type': phase_generator_type,
|
||||
'learn_tau': False,
|
||||
'learn_delay': True
|
||||
},
|
||||
{'basis_generator_type': 'rbf',
|
||||
{'basis_generator_type': basis_generator_type,
|
||||
}, seed=SEED)
|
||||
|
||||
d = True
|
||||
@ -274,21 +288,23 @@ def test_learn_delay(mp_type: str, delay: float):
|
||||
# Check active trajectory section is different to beginning values
|
||||
assert np.all(pos[max(1, delay_time_steps):] != pos[0])
|
||||
assert np.all(vel[max(1, delay_time_steps)] != vel[0])
|
||||
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp'])
|
||||
#
|
||||
#
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'prodmp'])
|
||||
@pytest.mark.parametrize('tau', [0.25, 0.5, 0.75, 1])
|
||||
@pytest.mark.parametrize('delay', [0.25, 0.5, 0.75, 1])
|
||||
def test_learn_tau_and_delay(mp_type: str, tau: float, delay: float):
|
||||
phase_generator_type = 'exp' if mp_type == 'prodmp' else 'linear'
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
env = fancy_gym.make_bb('toy-v0', [ToyWrapper], {'verbose': 2},
|
||||
{'trajectory_generator_type': mp_type,
|
||||
},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': 'linear',
|
||||
{'phase_generator_type': phase_generator_type,
|
||||
'learn_tau': True,
|
||||
'learn_delay': True
|
||||
},
|
||||
{'basis_generator_type': 'rbf',
|
||||
{'basis_generator_type': basis_generator_type,
|
||||
}, seed=SEED)
|
||||
|
||||
if env.spec.max_episode_steps * env.dt < delay + tau:
|
||||
@ -315,8 +331,9 @@ def test_learn_tau_and_delay(mp_type: str, tau: float, delay: float):
|
||||
vel = info['velocities'].flatten()
|
||||
|
||||
# Check end is all same (only true for linear basis)
|
||||
assert np.all(pos[joint_time_steps:] == pos[-1])
|
||||
assert np.all(vel[joint_time_steps:] == vel[-1])
|
||||
if phase_generator_type == "linear":
|
||||
assert np.all(pos[joint_time_steps:] == pos[-1])
|
||||
assert np.all(vel[joint_time_steps:] == vel[-1])
|
||||
|
||||
# Check beginning is all same (only true for linear basis)
|
||||
assert np.all(pos[:delay_time_steps - 1] == pos[0])
|
||||
@ -326,4 +343,4 @@ def test_learn_tau_and_delay(mp_type: str, tau: float, delay: float):
|
||||
active_pos = pos[delay_time_steps: joint_time_steps - 1]
|
||||
active_vel = vel[delay_time_steps: joint_time_steps - 2]
|
||||
assert np.all(active_pos != pos[-1]) and np.all(active_pos != pos[0])
|
||||
assert np.all(active_vel != vel[-1]) and np.all(active_vel != vel[0])
|
||||
assert np.all(active_vel != vel[-1]) and np.all(active_vel != vel[0])
|
@ -98,7 +98,7 @@ def test_learn_sub_trajectories(mp_type: str, env_wrap: Tuple[str, Type[RawInter
|
||||
assert length <= np.round(env.traj_gen.tau.numpy() / env.dt)
|
||||
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp'])
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'dmp', 'prodmp'])
|
||||
@pytest.mark.parametrize('env_wrap', zip(ENV_IDS, WRAPPERS))
|
||||
@pytest.mark.parametrize('add_time_aware_wrapper_before', [True, False])
|
||||
@pytest.mark.parametrize('replanning_time', [10, 100, 1000])
|
||||
@ -114,11 +114,14 @@ def test_replanning_time(mp_type: str, env_wrap: Tuple[str, Type[RawInterfaceWra
|
||||
|
||||
replanning_schedule = lambda c_pos, c_vel, obs, c_action, t: t % replanning_time == 0
|
||||
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
phase_generator_type = 'exp' if 'dmp' in mp_type else 'linear'
|
||||
|
||||
env = fancy_gym.make_bb(env_id, [wrapper_class], {'replanning_schedule': replanning_schedule, 'verbose': 2},
|
||||
{'trajectory_generator_type': mp_type},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': 'exp'},
|
||||
{'basis_generator_type': 'rbf'}, seed=SEED)
|
||||
{'phase_generator_type': phase_generator_type},
|
||||
{'basis_generator_type': basis_generator_type}, seed=SEED)
|
||||
|
||||
assert env.do_replanning
|
||||
assert callable(env.replanning_schedule)
|
||||
@ -142,3 +145,189 @@ def test_replanning_time(mp_type: str, env_wrap: Tuple[str, Type[RawInterfaceWra
|
||||
env.reset()
|
||||
|
||||
assert replanning_schedule(None, None, None, None, length)
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'prodmp'])
|
||||
@pytest.mark.parametrize('max_planning_times', [1, 2, 3, 4])
|
||||
@pytest.mark.parametrize('sub_segment_steps', [5, 10])
|
||||
def test_max_planning_times(mp_type: str, max_planning_times: int, sub_segment_steps: int):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
phase_generator_type = 'exp' if mp_type == 'prodmp' else 'linear'
|
||||
env = fancy_gym.make_bb('toy-v0', [ToyWrapper],
|
||||
{'max_planning_times': max_planning_times,
|
||||
'replanning_schedule': lambda pos, vel, obs, action, t: t % sub_segment_steps == 0,
|
||||
'verbose': 2},
|
||||
{'trajectory_generator_type': mp_type,
|
||||
},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': phase_generator_type,
|
||||
'learn_tau': False,
|
||||
'learn_delay': False
|
||||
},
|
||||
{'basis_generator_type': basis_generator_type,
|
||||
},
|
||||
seed=SEED)
|
||||
_ = env.reset()
|
||||
d = False
|
||||
planning_times = 0
|
||||
while not d:
|
||||
_, _, d, _ = env.step(env.action_space.sample())
|
||||
planning_times += 1
|
||||
assert planning_times == max_planning_times
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'prodmp'])
|
||||
@pytest.mark.parametrize('max_planning_times', [1, 2, 3, 4])
|
||||
@pytest.mark.parametrize('sub_segment_steps', [5, 10])
|
||||
@pytest.mark.parametrize('tau', [0.5, 1.0, 1.5, 2.0])
|
||||
def test_replanning_with_learn_tau(mp_type: str, max_planning_times: int, sub_segment_steps: int, tau: float):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
phase_generator_type = 'exp' if mp_type == 'prodmp' else 'linear'
|
||||
env = fancy_gym.make_bb('toy-v0', [ToyWrapper],
|
||||
{'replanning_schedule': lambda pos, vel, obs, action, t: t % sub_segment_steps == 0,
|
||||
'max_planning_times': max_planning_times,
|
||||
'verbose': 2},
|
||||
{'trajectory_generator_type': mp_type,
|
||||
},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': phase_generator_type,
|
||||
'learn_tau': True,
|
||||
'learn_delay': False
|
||||
},
|
||||
{'basis_generator_type': basis_generator_type,
|
||||
},
|
||||
seed=SEED)
|
||||
_ = env.reset()
|
||||
d = False
|
||||
planning_times = 0
|
||||
while not d:
|
||||
action = env.action_space.sample()
|
||||
action[0] = tau
|
||||
_, _, d, info = env.step(action)
|
||||
planning_times += 1
|
||||
assert planning_times == max_planning_times
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'prodmp'])
|
||||
@pytest.mark.parametrize('max_planning_times', [1, 2, 3, 4])
|
||||
@pytest.mark.parametrize('sub_segment_steps', [5, 10])
|
||||
@pytest.mark.parametrize('delay', [0.1, 0.25, 0.5, 0.75])
|
||||
def test_replanning_with_learn_delay(mp_type: str, max_planning_times: int, sub_segment_steps: int, delay: float):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
phase_generator_type = 'exp' if mp_type == 'prodmp' else 'linear'
|
||||
env = fancy_gym.make_bb('toy-v0', [ToyWrapper],
|
||||
{'replanning_schedule': lambda pos, vel, obs, action, t: t % sub_segment_steps == 0,
|
||||
'max_planning_times': max_planning_times,
|
||||
'verbose': 2},
|
||||
{'trajectory_generator_type': mp_type,
|
||||
},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': phase_generator_type,
|
||||
'learn_tau': False,
|
||||
'learn_delay': True
|
||||
},
|
||||
{'basis_generator_type': basis_generator_type,
|
||||
},
|
||||
seed=SEED)
|
||||
_ = env.reset()
|
||||
d = False
|
||||
planning_times = 0
|
||||
while not d:
|
||||
action = env.action_space.sample()
|
||||
action[0] = delay
|
||||
_, _, d, info = env.step(action)
|
||||
|
||||
delay_time_steps = int(np.round(delay / env.dt))
|
||||
pos = info['positions'].flatten()
|
||||
vel = info['velocities'].flatten()
|
||||
|
||||
# Check beginning is all same (only true for linear basis)
|
||||
if planning_times == 0:
|
||||
assert np.all(pos[:max(1, delay_time_steps - 1)] == pos[0])
|
||||
assert np.all(vel[:max(1, delay_time_steps - 2)] == vel[0])
|
||||
|
||||
# only valid when delay < sub_segment_steps
|
||||
elif planning_times > 0 and delay_time_steps < sub_segment_steps:
|
||||
assert np.all(pos[1:max(1, delay_time_steps - 1)] != pos[0])
|
||||
assert np.all(vel[1:max(1, delay_time_steps - 2)] != vel[0])
|
||||
|
||||
# Check active trajectory section is different to beginning values
|
||||
assert np.all(pos[max(1, delay_time_steps):] != pos[0])
|
||||
assert np.all(vel[max(1, delay_time_steps)] != vel[0])
|
||||
|
||||
planning_times += 1
|
||||
|
||||
assert planning_times == max_planning_times
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'prodmp'])
|
||||
@pytest.mark.parametrize('max_planning_times', [1, 2, 3])
|
||||
@pytest.mark.parametrize('sub_segment_steps', [5, 10, 15])
|
||||
@pytest.mark.parametrize('delay', [0, 0.25, 0.5, 0.75])
|
||||
@pytest.mark.parametrize('tau', [0.5, 0.75, 1.0])
|
||||
def test_replanning_with_learn_delay_and_tau(mp_type: str, max_planning_times: int, sub_segment_steps: int,
|
||||
delay: float, tau: float):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
phase_generator_type = 'exp' if mp_type == 'prodmp' else 'linear'
|
||||
env = fancy_gym.make_bb('toy-v0', [ToyWrapper],
|
||||
{'replanning_schedule': lambda pos, vel, obs, action, t: t % sub_segment_steps == 0,
|
||||
'max_planning_times': max_planning_times,
|
||||
'verbose': 2},
|
||||
{'trajectory_generator_type': mp_type,
|
||||
},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': phase_generator_type,
|
||||
'learn_tau': True,
|
||||
'learn_delay': True
|
||||
},
|
||||
{'basis_generator_type': basis_generator_type,
|
||||
},
|
||||
seed=SEED)
|
||||
_ = env.reset()
|
||||
d = False
|
||||
planning_times = 0
|
||||
while not d:
|
||||
action = env.action_space.sample()
|
||||
action[0] = tau
|
||||
action[1] = delay
|
||||
_, _, d, info = env.step(action)
|
||||
|
||||
delay_time_steps = int(np.round(delay / env.dt))
|
||||
|
||||
pos = info['positions'].flatten()
|
||||
vel = info['velocities'].flatten()
|
||||
|
||||
# Delay only applies to first planning time
|
||||
if planning_times == 0:
|
||||
# Check delay is applied
|
||||
assert np.all(pos[:max(1, delay_time_steps - 1)] == pos[0])
|
||||
assert np.all(vel[:max(1, delay_time_steps - 2)] == vel[0])
|
||||
# Check active trajectory section is different to beginning values
|
||||
assert np.all(pos[max(1, delay_time_steps):] != pos[0])
|
||||
assert np.all(vel[max(1, delay_time_steps)] != vel[0])
|
||||
|
||||
planning_times += 1
|
||||
|
||||
assert planning_times == max_planning_times
|
||||
|
||||
@pytest.mark.parametrize('mp_type', ['promp', 'prodmp'])
|
||||
@pytest.mark.parametrize('max_planning_times', [1, 2, 3, 4])
|
||||
@pytest.mark.parametrize('sub_segment_steps', [5, 10])
|
||||
def test_replanning_schedule(mp_type: str, max_planning_times: int, sub_segment_steps: int):
|
||||
basis_generator_type = 'prodmp' if mp_type == 'prodmp' else 'rbf'
|
||||
phase_generator_type = 'exp' if mp_type == 'prodmp' else 'linear'
|
||||
env = fancy_gym.make_bb('toy-v0', [ToyWrapper],
|
||||
{'max_planning_times': max_planning_times,
|
||||
'replanning_schedule': lambda pos, vel, obs, action, t: t % sub_segment_steps == 0,
|
||||
'verbose': 2},
|
||||
{'trajectory_generator_type': mp_type,
|
||||
},
|
||||
{'controller_type': 'motor'},
|
||||
{'phase_generator_type': phase_generator_type,
|
||||
'learn_tau': False,
|
||||
'learn_delay': False
|
||||
},
|
||||
{'basis_generator_type': basis_generator_type,
|
||||
},
|
||||
seed=SEED)
|
||||
_ = env.reset()
|
||||
d = False
|
||||
for i in range(max_planning_times):
|
||||
_, _, d, _ = env.step(env.action_space.sample())
|
||||
assert d
|
||||
|
@ -49,8 +49,8 @@ def run_env(env_id, iterations=None, seed=0, render=False):
|
||||
|
||||
if done:
|
||||
break
|
||||
|
||||
assert done, "Done flag is not True after end of episode."
|
||||
if not hasattr(env, "replanning_schedule"):
|
||||
assert done, "Done flag is not True after end of episode."
|
||||
observations.append(obs)
|
||||
env.close()
|
||||
del env
|
||||
|
Loading…
Reference in New Issue
Block a user