fancy_gym/alr_envs/alr/__init__.py

import numpy as np
from gym import register

from . import classic_control, mujoco
from .classic_control.hole_reacher.hole_reacher import HoleReacherEnv
from .classic_control.simple_reacher.simple_reacher import SimpleReacherEnv
from .classic_control.viapoint_reacher.viapoint_reacher import ViaPointReacherEnv
from .mujoco.ball_in_a_cup.ball_in_a_cup import ALRBallInACupEnv
from .mujoco.ball_in_a_cup.biac_pd import ALRBallInACupPDEnv
from .mujoco.reacher.alr_reacher import ALRReacherEnv
from .mujoco.reacher.balancing import BalancingEnv

from .mujoco.table_tennis.tt_gym import MAX_EPISODE_STEPS

ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS = {"DMP": [], "ProMP": []}

# Classic Control
## Simple Reacher
register(
    id='SimpleReacher-v0',
    entry_point='alr_envs.alr.classic_control:SimpleReacherEnv',
    max_episode_steps=200,
    kwargs={
        "n_links": 2,
    }
)

register(
    id='SimpleReacher-v1',
    entry_point='alr_envs.alr.classic_control:SimpleReacherEnv',
    max_episode_steps=200,
    kwargs={
        "n_links": 2,
        "random_start": False
    }
)

register(
    id='LongSimpleReacher-v0',
    entry_point='alr_envs.alr.classic_control:SimpleReacherEnv',
    max_episode_steps=200,
    kwargs={
        "n_links": 5,
    }
)

register(
    id='LongSimpleReacher-v1',
    entry_point='alr_envs.alr.classic_control:SimpleReacherEnv',
    max_episode_steps=200,
    kwargs={
        "n_links": 5,
        "random_start": False
    }
)

## Viapoint Reacher

register(
    id='ViaPointReacher-v0',
    entry_point='alr_envs.alr.classic_control:ViaPointReacherEnv',
    max_episode_steps=200,
    kwargs={
        "n_links": 5,
        "allow_self_collision": False,
        "collision_penalty": 1000
    }
)

## Hole Reacher
register(
    id='HoleReacher-v0',
    entry_point='alr_envs.alr.classic_control:HoleReacherEnv',
    max_episode_steps=200,
    kwargs={
        "n_links": 5,
        "random_start": True,
        "allow_self_collision": False,
        "allow_wall_collision": False,
        "hole_width": None,
        "hole_depth": 1,
        "hole_x": None,
        "collision_penalty": 100,
    }
)

register(
    id='HoleReacher-v1',
    entry_point='alr_envs.alr.classic_control:HoleReacherEnv',
    max_episode_steps=200,
    kwargs={
        "n_links": 5,
        "random_start": False,
        "allow_self_collision": False,
        "allow_wall_collision": False,
        "hole_width": 0.25,
        "hole_depth": 1,
        "hole_x": None,
        "collision_penalty": 100,
    }
)

register(
    id='HoleReacher-v2',
    entry_point='alr_envs.alr.classic_control:HoleReacherEnv',
    max_episode_steps=200,
    kwargs={
        "n_links": 5,
        "random_start": False,
        "allow_self_collision": False,
        "allow_wall_collision": False,
        "hole_width": 0.25,
        "hole_depth": 1,
        "hole_x": 2,
        "collision_penalty": 1,
    }
)

# Mujoco

## Reacher
register(
    id='ALRReacher-v0',
    entry_point='alr_envs.alr.mujoco:ALRReacherEnv',
    max_episode_steps=200,
    kwargs={
        "steps_before_reward": 0,
        "n_links": 5,
        "balance": False,
    }
)

register(
    id='ALRReacherSparse-v0',
    entry_point='alr_envs.alr.mujoco:ALRReacherEnv',
    max_episode_steps=200,
    kwargs={
        "steps_before_reward": 200,
        "n_links": 5,
        "balance": False,
    }
)

register(
    id='ALRReacherSparseBalanced-v0',
    entry_point='alr_envs.alr.mujoco:ALRReacherEnv',
    max_episode_steps=200,
    kwargs={
        "steps_before_reward": 200,
        "n_links": 5,
        "balance": True,
    }
)

register(
    id='ALRLongReacher-v0',
    entry_point='alr_envs.alr.mujoco:ALRReacherEnv',
    max_episode_steps=200,
    kwargs={
        "steps_before_reward": 0,
        "n_links": 7,
        "balance": False,
    }
)

register(
    id='ALRLongReacherSparse-v0',
    entry_point='alr_envs.alr.mujoco:ALRReacherEnv',
    max_episode_steps=200,
    kwargs={
        "steps_before_reward": 200,
        "n_links": 7,
        "balance": False,
    }
)

register(
    id='ALRLongReacherSparseBalanced-v0',
    entry_point='alr_envs.alr.mujoco:ALRReacherEnv',
    max_episode_steps=200,
    kwargs={
        "steps_before_reward": 200,
        "n_links": 7,
        "balance": True,
    }
)

## Balancing Reacher

register(
    id='Balancing-v0',
    entry_point='alr_envs.alr.mujoco:BalancingEnv',
    max_episode_steps=200,
    kwargs={
        "n_links": 5,
    }
)

## Table Tennis
register(id='TableTennis2DCtxt-v0',
         entry_point='alr_envs.alr.mujoco:TTEnvGym',
         max_episode_steps=MAX_EPISODE_STEPS,
         kwargs={'ctxt_dim': 2})

register(id='TableTennis2DCtxt-v1',
         entry_point='alr_envs.alr.mujoco:TTEnvGym',
         max_episode_steps=MAX_EPISODE_STEPS,
         kwargs={'ctxt_dim': 2, 'fixed_goal': True})

register(id='TableTennis4DCtxt-v0',
         entry_point='alr_envs.alr.mujoco:TTEnvGym',
         max_episode_steps=MAX_EPISODE_STEPS,
         kwargs={'ctxt_dim': 4})

## BeerPong
difficulties = ["simple", "intermediate", "hard", "hardest"]

for v, difficulty in enumerate(difficulties):
    register(
        id='ALRBeerPong-v{}'.format(v),
        entry_point='alr_envs.alr.mujoco:ALRBeerBongEnv',
        max_episode_steps=600,
        kwargs={
            "difficulty": difficulty,
            "reward_type": "staged",
        }
    )

# Motion Primitive Environments

## Simple Reacher
_versions = ["SimpleReacher-v0", "SimpleReacher-v1", "LongSimpleReacher-v0", "LongSimpleReacher-v1"]
for _v in _versions:
    _name = _v.split("-")
    _env_id = f'{_name[0]}DMP-{_name[1]}'
    register(
        id=_env_id,
        entry_point='alr_envs.utils.make_env_helpers:make_dmp_env_helper',
        # max_episode_steps=1,
        kwargs={
            "name": f"alr_envs:{_v}",
            "wrappers": [classic_control.simple_reacher.MPWrapper],
            "mp_kwargs": {
                "num_dof": 2 if "long" not in _v.lower() else 5,
                "num_basis": 5,
                "duration": 2,
                "alpha_phase": 2,
                "learn_goal": True,
                "policy_type": "motor",
                "weights_scale": 50,
                "policy_kwargs": {
                    "p_gains": .6,
                    "d_gains": .075
                }
            }
        }
    )
    ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["DMP"].append(_env_id)

    _env_id = f'{_name[0]}ProMP-{_name[1]}'
    register(
        id=_env_id,
        entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',
        kwargs={
            "name": f"alr_envs:{_v}",
            "wrappers": [classic_control.simple_reacher.MPWrapper],
            "mp_kwargs": {
                "num_dof": 2 if "long" not in _v.lower() else 5,
                "num_basis": 5,
                "duration": 2,
                "policy_type": "motor",
                "weights_scale": 1,
                "zero_start": True,
                "policy_kwargs": {
                    "p_gains": .6,
                    "d_gains": .075
                }
            }
        }
    )
    ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)

# Viapoint reacher
register(
    id='ViaPointReacherDMP-v0',
    entry_point='alr_envs.utils.make_env_helpers:make_dmp_env_helper',
    # max_episode_steps=1,
    kwargs={
        "name": "alr_envs:ViaPointReacher-v0",
        "wrappers": [classic_control.viapoint_reacher.MPWrapper],
        "mp_kwargs": {
            "num_dof": 5,
            "num_basis": 5,
            "duration": 2,
            "learn_goal": True,
            "alpha_phase": 2,
            "policy_type": "velocity",
            "weights_scale": 50,
        }
    }
)
ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["DMP"].append("ViaPointReacherDMP-v0")

register(
    id="ViaPointReacherProMP-v0",
    entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',
    kwargs={
        "name": f"alr_envs:ViaPointReacher-v0",
        "wrappers": [classic_control.viapoint_reacher.MPWrapper],
        "mp_kwargs": {
            "num_dof": 5,
            "num_basis": 5,
            "duration": 2,
            "policy_type": "velocity",
            "weights_scale": 1,
            "zero_start": True
        }
    }
)
ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append("ViaPointReacherProMP-v0")

## Hole Reacher
_versions = ["v0", "v1", "v2"]
for _v in _versions:
    _env_id = f'HoleReacherDMP-{_v}'
    register(
        id=_env_id,
        entry_point='alr_envs.utils.make_env_helpers:make_dmp_env_helper',
        # max_episode_steps=1,
        kwargs={
            "name": f"alr_envs:HoleReacher-{_v}",
            "wrappers": [classic_control.hole_reacher.MPWrapper],
            "mp_kwargs": {
                "num_dof": 5,
                "num_basis": 5,
                "duration": 2,
                "learn_goal": True,
                "alpha_phase": 2.5,
                "bandwidth_factor": 2,
                "policy_type": "velocity",
                "weights_scale": 50,
                "goal_scale": 0.1
            }
        }
    )
    ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["DMP"].append(_env_id)

    _env_id = f'HoleReacherProMP-{_v}'
    register(
        id=_env_id,
        entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',
        kwargs={
            "name": f"alr_envs:HoleReacher-{_v}",
            "wrappers": [classic_control.hole_reacher.MPWrapper],
            "mp_kwargs": {
                "num_dof": 5,
                "num_basis": 5,
                "duration": 2,
                "policy_type": "velocity",
                "weights_scale": 0.1,
                "zero_start": True
            }
        }
    )
    ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)
    
## ALRReacher
_versions = ["ALRReacher-v0", "ALRLongReacher-v0", "ALRReacherSparse-v0", "ALRLongReacherSparse-v0"]
for _v in _versions:
    _name = _v.split("-")
    _env_id = f'{_name[0]}DMP-{_name[1]}'
    register(
        id=_env_id,
        entry_point='alr_envs.utils.make_env_helpers:make_dmp_env_helper',
        # max_episode_steps=1,
        kwargs={
            "name": f"alr_envs:{_v}",
            "wrappers": [mujoco.reacher.MPWrapper],
            "mp_kwargs": {
                "num_dof": 5 if "long" not in _v.lower() else 7,
                "num_basis": 5,
                "duration": 4,
                "alpha_phase": 2,
                "learn_goal": True,
                "policy_type": "motor",
                "weights_scale": 1,
                "policy_kwargs": {
                    "p_gains": 1,
                    "d_gains": 0.1
                }
            }
        }
    )
    ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["DMP"].append(_env_id)

    _env_id = f'{_name[0]}ProMP-{_name[1]}'
    register(
        id=_env_id,
        entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',
        kwargs={
            "name": f"alr_envs:{_v}",
            "wrappers": [mujoco.reacher.MPWrapper],
            "mp_kwargs": {
                "num_dof": 5 if "long" not in _v.lower() else 7,
                "num_basis": 5,
                "duration": 4,
                "policy_type": "motor",
                "weights_scale": 1,
                "zero_start": True,
                "policy_kwargs": {
                    "p_gains": 1,
                    "d_gains": 0.1
                }
            }
        }
    )
    ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)

## Beerpong
_versions = ["v0", "v1", "v2", "v3"]
for _v in _versions:
    _env_id = f'BeerpongProMP-{_v}'
    register(
        id=_env_id,
        entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',
        kwargs={
            "name": f"alr_envs:ALRBeerPong-{_v}",
            "wrappers": [mujoco.beerpong.MPWrapper],
            "mp_kwargs": {
                "num_dof": 7,
                "num_basis": 2,
                "duration": 1,
                "post_traj_time": 2,
                "policy_type": "motor",
                "weights_scale": 1,
                "zero_start": True,
                "zero_goal": False,
                "policy_kwargs": {
                    "p_gains": np.array([       1.5,   5,   2.55,    3,   2.,    2,   1.25]),
                    "d_gains": np.array([0.02333333, 0.1, 0.0625, 0.08, 0.03, 0.03, 0.0125])
                }
            }
        }
    )
    ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)

## Table Tennis
ctxt_dim = [2, 4]
for _v, cd in enumerate(ctxt_dim):
    _env_id = f'TableTennisProMP-v{_v}'
    register(
        id=_env_id,
        entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',
        kwargs={
            "name": "alr_envs:TableTennis{}DCtxt-v0".format(cd),
            "wrappers": [mujoco.table_tennis.MPWrapper],
            "mp_kwargs": {
                "num_dof": 7,
                "num_basis": 2,
                "duration": 1.25,
                "post_traj_time": 4.5,
                "policy_type": "motor",
                "weights_scale": 1.0,
                "zero_start": True,
                "zero_goal": False,
                "policy_kwargs": {
                    "p_gains": 0.5*np.array([1.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0]),
                    "d_gains": 0.5*np.array([0.1, 0.4, 0.2, 0.4, 0.1, 0.4, 0.1])
                }
            }
        }
    )
    ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)

register(
    id='TableTennisProMP-v2',
    entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',
    kwargs={
        "name": "alr_envs:TableTennis2DCtxt-v1",
        "wrappers": [mujoco.table_tennis.MPWrapper],
        "mp_kwargs": {
            "num_dof": 7,
            "num_basis": 2,
            "duration": 1.,
            "post_traj_time": 2.5,
            "policy_type": "motor",
            "weights_scale": 1,
            "off": -0.05,
            "bandwidth_factor": 3.5,
            "zero_start": True,
            "zero_goal": False,
            "policy_kwargs": {
                "p_gains": 0.5*np.array([1.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0]),
                "d_gains": 0.5*np.array([0.1, 0.4, 0.2, 0.4, 0.1, 0.4, 0.1])
            }
        }
    }
)
ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append("TableTennisProMP-v2")
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00			`import numpy as np`
improved project structure and exposed methods 2021-08-25 17:16:20 +02:00			`from gym import register`

			`from . import classic_control, mujoco`
			`from .classic_control.hole_reacher.hole_reacher import HoleReacherEnv`
			`from .classic_control.simple_reacher.simple_reacher import SimpleReacherEnv`
			`from .classic_control.viapoint_reacher.viapoint_reacher import ViaPointReacherEnv`
			`from .mujoco.ball_in_a_cup.ball_in_a_cup import ALRBallInACupEnv`
			`from .mujoco.ball_in_a_cup.biac_pd import ALRBallInACupPDEnv`
			`from .mujoco.reacher.alr_reacher import ALRReacherEnv`
			`from .mujoco.reacher.balancing import BalancingEnv`

Added ALRReacherProMP 2022-01-25 15:23:57 +01:00			`from .mujoco.table_tennis.tt_gym import MAX_EPISODE_STEPS`
Merge branch 'master' into deprecate_detpmp # Conflicts: # README.md # alr_envs/alr/__init__.py 2021-12-01 16:34:18 +01:00
replaced all detpmp with promp 2021-11-30 16:11:32 +01:00			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS = {"DMP": [], "ProMP": []}`
improved project structure and exposed methods 2021-08-25 17:16:20 +02:00
			`# Classic Control`
			`## Simple Reacher`
			`register(`
			`id='SimpleReacher-v0',`
			`entry_point='alr_envs.alr.classic_control:SimpleReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"n_links": 2,`
			`}`
			`)`

			`register(`
			`id='SimpleReacher-v1',`
			`entry_point='alr_envs.alr.classic_control:SimpleReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"n_links": 2,`
			`"random_start": False`
			`}`
			`)`

			`register(`
			`id='LongSimpleReacher-v0',`
			`entry_point='alr_envs.alr.classic_control:SimpleReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"n_links": 5,`
			`}`
			`)`

			`register(`
			`id='LongSimpleReacher-v1',`
			`entry_point='alr_envs.alr.classic_control:SimpleReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"n_links": 5,`
			`"random_start": False`
			`}`
			`)`

			`## Viapoint Reacher`

			`register(`
			`id='ViaPointReacher-v0',`
			`entry_point='alr_envs.alr.classic_control:ViaPointReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"n_links": 5,`
			`"allow_self_collision": False,`
			`"collision_penalty": 1000`
			`}`
			`)`

			`## Hole Reacher`
			`register(`
			`id='HoleReacher-v0',`
			`entry_point='alr_envs.alr.classic_control:HoleReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"n_links": 5,`
			`"random_start": True,`
			`"allow_self_collision": False,`
			`"allow_wall_collision": False,`
			`"hole_width": None,`
			`"hole_depth": 1,`
			`"hole_x": None,`
			`"collision_penalty": 100,`
			`}`
			`)`

			`register(`
			`id='HoleReacher-v1',`
reacher envs cleanup - base classes for direct and torque control - added promp wrapper support 2021-11-26 16:31:46 +01:00			`entry_point='alr_envs.alr.classic_control:HoleReacherEnv',`
improved project structure and exposed methods 2021-08-25 17:16:20 +02:00			`max_episode_steps=200,`
			`kwargs={`
			`"n_links": 5,`
			`"random_start": False,`
			`"allow_self_collision": False,`
			`"allow_wall_collision": False,`
			`"hole_width": 0.25,`
			`"hole_depth": 1,`
			`"hole_x": None,`
			`"collision_penalty": 100,`
			`}`
			`)`

			`register(`
			`id='HoleReacher-v2',`
			`entry_point='alr_envs.alr.classic_control:HoleReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"n_links": 5,`
			`"random_start": False,`
			`"allow_self_collision": False,`
			`"allow_wall_collision": False,`
			`"hole_width": 0.25,`
			`"hole_depth": 1,`
			`"hole_x": 2,`
reacher envs cleanup - base classes for direct and torque control - added promp wrapper support 2021-11-26 16:31:46 +01:00			`"collision_penalty": 1,`
improved project structure and exposed methods 2021-08-25 17:16:20 +02:00			`}`
			`)`

			`# Mujoco`

			`## Reacher`
			`register(`
			`id='ALRReacher-v0',`
			`entry_point='alr_envs.alr.mujoco:ALRReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"steps_before_reward": 0,`
			`"n_links": 5,`
			`"balance": False,`
			`}`
			`)`

			`register(`
			`id='ALRReacherSparse-v0',`
			`entry_point='alr_envs.alr.mujoco:ALRReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"steps_before_reward": 200,`
			`"n_links": 5,`
			`"balance": False,`
			`}`
			`)`

			`register(`
			`id='ALRReacherSparseBalanced-v0',`
			`entry_point='alr_envs.alr.mujoco:ALRReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"steps_before_reward": 200,`
			`"n_links": 5,`
			`"balance": True,`
			`}`
			`)`

			`register(`
			`id='ALRLongReacher-v0',`
			`entry_point='alr_envs.alr.mujoco:ALRReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"steps_before_reward": 0,`
			`"n_links": 7,`
			`"balance": False,`
			`}`
			`)`

			`register(`
			`id='ALRLongReacherSparse-v0',`
			`entry_point='alr_envs.alr.mujoco:ALRReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"steps_before_reward": 200,`
			`"n_links": 7,`
			`"balance": False,`
			`}`
			`)`

			`register(`
			`id='ALRLongReacherSparseBalanced-v0',`
			`entry_point='alr_envs.alr.mujoco:ALRReacherEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"steps_before_reward": 200,`
			`"n_links": 7,`
			`"balance": True,`
			`}`
			`)`

			`## Balancing Reacher`

			`register(`
			`id='Balancing-v0',`
			`entry_point='alr_envs.alr.mujoco:BalancingEnv',`
			`max_episode_steps=200,`
			`kwargs={`
			`"n_links": 5,`
			`}`
			`)`

Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00			`## Table Tennis`
			`register(id='TableTennis2DCtxt-v0',`
updated table tennis and beerpong for promp usage 2021-12-06 13:43:45 +01:00			`entry_point='alr_envs.alr.mujoco:TTEnvGym',`
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00			`max_episode_steps=MAX_EPISODE_STEPS,`
updated table tennis and beerpong for promp usage 2021-12-06 13:43:45 +01:00			`kwargs={'ctxt_dim': 2})`

			`register(id='TableTennis2DCtxt-v1',`
			`entry_point='alr_envs.alr.mujoco:TTEnvGym',`
small bp and tt updates 2021-12-07 14:46:31 +01:00			`max_episode_steps=MAX_EPISODE_STEPS,`
updated table tennis and beerpong for promp usage 2021-12-06 13:43:45 +01:00			`kwargs={'ctxt_dim': 2, 'fixed_goal': True})`
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00
			`register(id='TableTennis4DCtxt-v0',`
updated table tennis and beerpong for promp usage 2021-12-06 13:43:45 +01:00			`entry_point='alr_envs.alr.mujoco:TTEnvGym',`
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00			`max_episode_steps=MAX_EPISODE_STEPS,`
updated table tennis and beerpong for promp usage 2021-12-06 13:43:45 +01:00			`kwargs={'ctxt_dim': 4})`
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00
			`## BeerPong`
			`difficulties = ["simple", "intermediate", "hard", "hardest"]`

			`for v, difficulty in enumerate(difficulties):`
			`register(`
			`id='ALRBeerPong-v{}'.format(v),`
			`entry_point='alr_envs.alr.mujoco:ALRBeerBongEnv',`
			`max_episode_steps=600,`
			`kwargs={`
			`"difficulty": difficulty,`
			`"reward_type": "staged",`
			`}`
			`)`

improved project structure and exposed methods 2021-08-25 17:16:20 +02:00			`# Motion Primitive Environments`

			`## Simple Reacher`
			`_versions = ["SimpleReacher-v0", "SimpleReacher-v1", "LongSimpleReacher-v0", "LongSimpleReacher-v1"]`
			`for _v in _versions:`
			`_name = _v.split("-")`
			`_env_id = f'{_name[0]}DMP-{_name[1]}'`
			`register(`
			`id=_env_id,`
			`entry_point='alr_envs.utils.make_env_helpers:make_dmp_env_helper',`
			`# max_episode_steps=1,`
			`kwargs={`
			`"name": f"alr_envs:{_v}",`
			`"wrappers": [classic_control.simple_reacher.MPWrapper],`
			`"mp_kwargs": {`
			`"num_dof": 2 if "long" not in _v.lower() else 5,`
			`"num_basis": 5,`
reacher envs pass unittests 2021-11-30 12:05:19 +01:00			`"duration": 2,`
improved project structure and exposed methods 2021-08-25 17:16:20 +02:00			`"alpha_phase": 2,`
			`"learn_goal": True,`
replaced all detpmp with promp 2021-11-30 16:11:32 +01:00			`"policy_type": "motor",`
improved project structure and exposed methods 2021-08-25 17:16:20 +02:00			`"weights_scale": 50,`
replaced all detpmp with promp 2021-11-30 16:11:32 +01:00			`"policy_kwargs": {`
			`"p_gains": .6,`
			`"d_gains": .075`
			`}`
improved project structure and exposed methods 2021-08-25 17:16:20 +02:00			`}`
			`}`
			`)`
			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["DMP"].append(_env_id)`

reacher envs cleanup - base classes for direct and torque control - added promp wrapper support 2021-11-26 16:31:46 +01:00			`_env_id = f'{_name[0]}ProMP-{_name[1]}'`
			`register(`
			`id=_env_id,`
			`entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',`
			`kwargs={`
			`"name": f"alr_envs:{_v}",`
			`"wrappers": [classic_control.simple_reacher.MPWrapper],`
			`"mp_kwargs": {`
			`"num_dof": 2 if "long" not in _v.lower() else 5,`
			`"num_basis": 5,`
			`"duration": 2,`
			`"policy_type": "motor",`
			`"weights_scale": 1,`
replaced all detpmp with promp 2021-11-30 16:11:32 +01:00			`"zero_start": True,`
			`"policy_kwargs": {`
			`"p_gains": .6,`
			`"d_gains": .075`
			`}`
reacher envs cleanup - base classes for direct and torque control - added promp wrapper support 2021-11-26 16:31:46 +01:00			`}`
			`}`
			`)`
			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)`

improved project structure and exposed methods 2021-08-25 17:16:20 +02:00			`# Viapoint reacher`
			`register(`
			`id='ViaPointReacherDMP-v0',`
			`entry_point='alr_envs.utils.make_env_helpers:make_dmp_env_helper',`
			`# max_episode_steps=1,`
			`kwargs={`
			`"name": "alr_envs:ViaPointReacher-v0",`
			`"wrappers": [classic_control.viapoint_reacher.MPWrapper],`
			`"mp_kwargs": {`
			`"num_dof": 5,`
			`"num_basis": 5,`
			`"duration": 2,`
			`"learn_goal": True,`
			`"alpha_phase": 2,`
			`"policy_type": "velocity",`
			`"weights_scale": 50,`
			`}`
			`}`
			`)`
			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["DMP"].append("ViaPointReacherDMP-v0")`

reacher envs cleanup - base classes for direct and torque control - added promp wrapper support 2021-11-26 16:31:46 +01:00			`register(`
			`id="ViaPointReacherProMP-v0",`
			`entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',`
			`kwargs={`
			`"name": f"alr_envs:ViaPointReacher-v0",`
			`"wrappers": [classic_control.viapoint_reacher.MPWrapper],`
			`"mp_kwargs": {`
			`"num_dof": 5,`
			`"num_basis": 5,`
			`"duration": 2,`
replaced all detpmp with promp 2021-11-30 16:11:32 +01:00			`"policy_type": "velocity",`
reacher envs cleanup - base classes for direct and torque control - added promp wrapper support 2021-11-26 16:31:46 +01:00			`"weights_scale": 1,`
			`"zero_start": True`
			`}`
			`}`
			`)`
			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append("ViaPointReacherProMP-v0")`

improved project structure and exposed methods 2021-08-25 17:16:20 +02:00			`## Hole Reacher`
			`_versions = ["v0", "v1", "v2"]`
			`for _v in _versions:`
			`_env_id = f'HoleReacherDMP-{_v}'`
			`register(`
			`id=_env_id,`
			`entry_point='alr_envs.utils.make_env_helpers:make_dmp_env_helper',`
			`# max_episode_steps=1,`
			`kwargs={`
			`"name": f"alr_envs:HoleReacher-{_v}",`
			`"wrappers": [classic_control.hole_reacher.MPWrapper],`
			`"mp_kwargs": {`
			`"num_dof": 5,`
			`"num_basis": 5,`
			`"duration": 2,`
			`"learn_goal": True,`
removed old holereacher env 2021-11-30 09:33:26 +01:00			`"alpha_phase": 2.5,`
improved project structure and exposed methods 2021-08-25 17:16:20 +02:00			`"bandwidth_factor": 2,`
			`"policy_type": "velocity",`
			`"weights_scale": 50,`
			`"goal_scale": 0.1`
			`}`
			`}`
			`)`
			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["DMP"].append(_env_id)`

added promp wrapped environments 2021-11-15 09:10:03 +01:00			`_env_id = f'HoleReacherProMP-{_v}'`
			`register(`
			`id=_env_id,`
			`entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',`
			`kwargs={`
			`"name": f"alr_envs:HoleReacher-{_v}",`
			`"wrappers": [classic_control.hole_reacher.MPWrapper],`
			`"mp_kwargs": {`
			`"num_dof": 5,`
			`"num_basis": 5,`
			`"duration": 2,`
			`"policy_type": "velocity",`
removed old holereacher env 2021-11-30 09:33:26 +01:00			`"weights_scale": 0.1,`
added promp wrapped environments 2021-11-15 09:10:03 +01:00			`"zero_start": True`
			`}`
			`}`
			`)`
			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)`
Added ALRReacherProMP 2022-01-25 15:23:57 +01:00
			`## ALRReacher`
			`_versions = ["ALRReacher-v0", "ALRLongReacher-v0", "ALRReacherSparse-v0", "ALRLongReacherSparse-v0"]`
			`for _v in _versions:`
			`_name = _v.split("-")`
			`_env_id = f'{_name[0]}DMP-{_name[1]}'`
			`register(`
			`id=_env_id,`
			`entry_point='alr_envs.utils.make_env_helpers:make_dmp_env_helper',`
			`# max_episode_steps=1,`
			`kwargs={`
			`"name": f"alr_envs:{_v}",`
			`"wrappers": [mujoco.reacher.MPWrapper],`
			`"mp_kwargs": {`
			`"num_dof": 5 if "long" not in _v.lower() else 7,`
			`"num_basis": 5,`
			`"duration": 4,`
			`"alpha_phase": 2,`
			`"learn_goal": True,`
			`"policy_type": "motor",`
			`"weights_scale": 1,`
			`"policy_kwargs": {`
			`"p_gains": 1,`
			`"d_gains": 0.1`
			`}`
			`}`
			`}`
			`)`
			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["DMP"].append(_env_id)`

			`_env_id = f'{_name[0]}ProMP-{_name[1]}'`
			`register(`
			`id=_env_id,`
			`entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',`
			`kwargs={`
			`"name": f"alr_envs:{_v}",`
			`"wrappers": [mujoco.reacher.MPWrapper],`
			`"mp_kwargs": {`
			`"num_dof": 5 if "long" not in _v.lower() else 7,`
			`"num_basis": 5,`
			`"duration": 4,`
			`"policy_type": "motor",`
			`"weights_scale": 1,`
			`"zero_start": True,`
			`"policy_kwargs": {`
			`"p_gains": 1,`
			`"d_gains": 0.1`
			`}`
			`}`
			`}`
			`)`
			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)`
added promp wrapped environments 2021-11-15 09:10:03 +01:00
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00			`## Beerpong`
small bp and tt updates 2021-12-07 14:46:31 +01:00			`_versions = ["v0", "v1", "v2", "v3"]`
			`for _v in _versions:`
			`_env_id = f'BeerpongProMP-{_v}'`
			`register(`
			`id=_env_id,`
			`entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',`
			`kwargs={`
			`"name": f"alr_envs:ALRBeerPong-{_v}",`
			`"wrappers": [mujoco.beerpong.MPWrapper],`
			`"mp_kwargs": {`
			`"num_dof": 7,`
			`"num_basis": 2,`
			`"duration": 1,`
			`"post_traj_time": 2,`
			`"policy_type": "motor",`
			`"weights_scale": 1,`
			`"zero_start": True,`
			`"zero_goal": False,`
			`"policy_kwargs": {`
			`"p_gains": np.array([ 1.5, 5, 2.55, 3, 2., 2, 1.25]),`
			`"d_gains": np.array([0.02333333, 0.1, 0.0625, 0.08, 0.03, 0.03, 0.0125])`
			`}`
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00			`}`
			`}`
small bp and tt updates 2021-12-07 14:46:31 +01:00			`)`
			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)`
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00
			`## Table Tennis`
updated table tennis and beerpong for promp usage 2021-12-06 13:43:45 +01:00			`ctxt_dim = [2, 4]`
			`for _v, cd in enumerate(ctxt_dim):`
			`_env_id = f'TableTennisProMP-v{_v}'`
			`register(`
			`id=_env_id,`
			`entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',`
			`kwargs={`
			`"name": "alr_envs:TableTennis{}DCtxt-v0".format(cd),`
			`"wrappers": [mujoco.table_tennis.MPWrapper],`
			`"mp_kwargs": {`
			`"num_dof": 7,`
			`"num_basis": 2,`
			`"duration": 1.25,`
			`"post_traj_time": 4.5,`
			`"policy_type": "motor",`
			`"weights_scale": 1.0,`
			`"zero_start": True,`
			`"zero_goal": False,`
			`"policy_kwargs": {`
			`"p_gains": 0.5*np.array([1.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0]),`
			`"d_gains": 0.5*np.array([0.1, 0.4, 0.2, 0.4, 0.1, 0.4, 0.1])`
			`}`
			`}`
			`}`
			`)`
			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append(_env_id)`

Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00			`register(`
updated table tennis and beerpong for promp usage 2021-12-06 13:43:45 +01:00			`id='TableTennisProMP-v2',`
Merge branch 'master' into deprecate_detpmp # Conflicts: # README.md # alr_envs/alr/__init__.py 2021-12-01 16:34:18 +01:00			`entry_point='alr_envs.utils.make_env_helpers:make_promp_env_helper',`
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00			`kwargs={`
updated table tennis and beerpong for promp usage 2021-12-06 13:43:45 +01:00			`"name": "alr_envs:TableTennis2DCtxt-v1",`
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00			`"wrappers": [mujoco.table_tennis.MPWrapper],`
			`"mp_kwargs": {`
			`"num_dof": 7,`
			`"num_basis": 2,`
updated table tennis and beerpong for promp usage 2021-12-06 13:43:45 +01:00			`"duration": 1.,`
			`"post_traj_time": 2.5,`
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00			`"policy_type": "motor",`
small bp and tt updates 2021-12-07 14:46:31 +01:00			`"weights_scale": 1,`
			`"off": -0.05,`
			`"bandwidth_factor": 3.5,`
Working Beerpong and TableTennis with MPWrapper 2021-11-05 11:04:04 +01:00			`"zero_start": True,`
			`"zero_goal": False,`
			`"policy_kwargs": {`
			`"p_gains": 0.5*np.array([1.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0]),`
			`"d_gains": 0.5*np.array([0.1, 0.4, 0.2, 0.4, 0.1, 0.4, 0.1])`
			`}`
			`}`
			`}`
			`)`
updated table tennis and beerpong for promp usage 2021-12-06 13:43:45 +01:00			`ALL_ALR_MOTION_PRIMITIVE_ENVIRONMENTS["ProMP"].append("TableTennisProMP-v2")`