fancy_gym/alr_envs/__init__.py

377 lines
8.4 KiB
Python
Raw Normal View History

2020-08-28 18:31:06 +02:00
from gym.envs.registration import register
2020-11-03 11:26:06 +01:00
from alr_envs.stochastic_search.functions.f_rosenbrock import Rosenbrock
2021-04-21 10:45:34 +02:00
# from alr_envs.utils.wrapper.dmp_wrapper import DmpWrapper
# Mujoco
2020-11-03 11:26:06 +01:00
2020-08-28 18:31:06 +02:00
register(
id='ALRReacher-v0',
entry_point='alr_envs.mujoco:ALRReacherEnv',
2020-09-19 17:47:20 +02:00
max_episode_steps=200,
kwargs={
"steps_before_reward": 0,
2020-09-22 17:41:25 +02:00
"n_links": 5,
"balance": False,
2020-09-22 17:41:25 +02:00
}
)
register(
id='ALRReacherSparse-v0',
2020-09-26 15:07:42 +02:00
entry_point='alr_envs.mujoco:ALRReacherEnv',
max_episode_steps=200,
2020-09-26 15:07:42 +02:00
kwargs={
"steps_before_reward": 200,
2020-09-26 15:07:42 +02:00
"n_links": 5,
"balance": False,
2020-09-26 15:07:42 +02:00
}
)
2020-09-22 17:41:25 +02:00
register(
id='ALRReacherSparseBalanced-v0',
2020-09-22 17:41:25 +02:00
entry_point='alr_envs.mujoco:ALRReacherEnv',
max_episode_steps=200,
kwargs={
"steps_before_reward": 200,
"n_links": 5,
"balance": True,
2020-09-19 17:47:20 +02:00
}
)
register(
id='ALRLongReacher-v0',
2020-09-19 17:47:20 +02:00
entry_point='alr_envs.mujoco:ALRReacherEnv',
max_episode_steps=200,
2020-09-19 17:47:20 +02:00
kwargs={
"steps_before_reward": 0,
"n_links": 7,
"balance": False,
2020-09-19 17:47:20 +02:00
}
)
register(
id='ALRLongReacherSparse-v0',
2020-09-19 17:47:20 +02:00
entry_point='alr_envs.mujoco:ALRReacherEnv',
max_episode_steps=200,
kwargs={
"steps_before_reward": 200,
2020-09-19 17:47:20 +02:00
"n_links": 7,
"balance": False,
2020-09-19 17:47:20 +02:00
}
)
register(
id='ALRLongReacherSparseBalanced-v0',
2020-09-19 17:47:20 +02:00
entry_point='alr_envs.mujoco:ALRReacherEnv',
max_episode_steps=200,
kwargs={
"steps_before_reward": 200,
2020-09-19 17:47:20 +02:00
"n_links": 7,
"balance": True,
2020-09-19 17:47:20 +02:00
}
)
2021-04-23 12:47:55 +02:00
register(
id='ALRBallInACupSimple-v0',
entry_point='alr_envs.mujoco:ALRBallInACupEnv',
max_episode_steps=4000,
kwargs={
"simplified": True,
"reward_type": "no_context"
}
)
2021-04-23 11:37:42 +02:00
register(
2021-04-23 12:16:19 +02:00
id='ALRBallInACup-v0',
2021-04-23 11:37:42 +02:00
entry_point='alr_envs.mujoco:ALRBallInACupEnv',
max_episode_steps=4000,
kwargs={
2021-04-23 12:47:55 +02:00
"reward_type": "no_context"
2021-04-23 11:37:42 +02:00
}
)
register(
id='ALRBallInACupGoal-v0',
entry_point='alr_envs.mujoco:ALRBallInACupEnv',
max_episode_steps=4000,
kwargs={
"reward_type": "contextual_goal"
}
)
# Classic control
2020-09-19 17:47:20 +02:00
register(
2021-03-26 15:57:15 +01:00
id='Balancing-v0',
entry_point='alr_envs.mujoco:BalancingEnv',
max_episode_steps=200,
2020-09-19 17:47:20 +02:00
kwargs={
2021-03-26 15:57:15 +01:00
"n_links": 5,
2020-09-19 17:47:20 +02:00
}
2020-08-28 18:31:06 +02:00
)
register(
id='SimpleReacher-v0',
entry_point='alr_envs.classic_control:SimpleReacherEnv',
max_episode_steps=200,
2020-08-28 18:31:06 +02:00
kwargs={
"n_links": 2,
}
)
2021-05-07 09:51:53 +02:00
register(
id='SimpleReacher-v1',
entry_point='alr_envs.classic_control:SimpleReacherEnv',
max_episode_steps=200,
kwargs={
"n_links": 2,
"random_start": False
}
)
2021-05-10 12:17:52 +02:00
register(
id='EpisodicSimpleReacher-v0',
entry_point='alr_envs.classic_control:EpisodicSimpleReacherEnv',
max_episode_steps=200,
kwargs={
"n_links": 2,
}
)
register(
id='EpisodicSimpleReacher-v1',
entry_point='alr_envs.classic_control:EpisodicSimpleReacherEnv',
max_episode_steps=200,
kwargs={
"n_links": 2,
"random_start": False
}
)
2021-03-26 15:32:50 +01:00
register(
id='LongSimpleReacher-v0',
entry_point='alr_envs.classic_control:SimpleReacherEnv',
2021-03-26 15:32:50 +01:00
max_episode_steps=200,
kwargs={
"n_links": 5,
}
)
register(
id='ViaPointReacher-v0',
entry_point='alr_envs.classic_control.viapoint_reacher:ViaPointReacher',
max_episode_steps=200,
kwargs={
"n_links": 5,
"allow_self_collision": False,
"collision_penalty": 1000
2020-08-28 18:31:06 +02:00
}
)
2020-11-03 11:26:06 +01:00
register(
id='HoleReacher-v0',
entry_point='alr_envs.classic_control.hole_reacher:HoleReacher',
2020-11-03 11:26:06 +01:00
max_episode_steps=200,
kwargs={
"n_links": 5,
"allow_self_collision": False,
"allow_wall_collision": False,
2021-04-21 10:45:34 +02:00
"hole_width": 0.25,
"hole_depth": 1,
2021-04-21 10:45:34 +02:00
"hole_x": 2,
"collision_penalty": 100,
2020-11-03 11:26:06 +01:00
}
)
2021-05-07 09:51:53 +02:00
register(
id='HoleReacher-v2',
entry_point='alr_envs.classic_control.hole_reacher_v2:HoleReacher',
max_episode_steps=200,
kwargs={
"n_links": 5,
"allow_self_collision": False,
"allow_wall_collision": False,
"hole_width": 0.25,
"hole_depth": 1,
"hole_x": 2,
"collision_penalty": 100,
}
)
2021-04-21 10:45:34 +02:00
# MP environments
2021-05-07 09:51:53 +02:00
register(
id='SimpleReacherDMP-v0',
entry_point='alr_envs.utils.make_env_helpers:make_dmp_env',
# max_episode_steps=1,
kwargs={
2021-05-10 12:17:52 +02:00
"name": "alr_envs:EpisodicSimpleReacher-v0",
2021-05-07 09:51:53 +02:00
"num_dof": 2,
"num_basis": 5,
"duration": 2,
"alpha_phase": 2,
"learn_goal": True,
"policy_type": "velocity",
"weights_scale": 50,
}
)
register(
id='SimpleReacherDMP-v1',
entry_point='alr_envs.utils.make_env_helpers:make_dmp_env',
# max_episode_steps=1,
kwargs={
2021-05-10 12:17:52 +02:00
"name": "alr_envs:EpisodicSimpleReacher-v1",
2021-05-07 09:51:53 +02:00
"num_dof": 2,
"num_basis": 5,
"duration": 2,
"alpha_phase": 2,
"learn_goal": True,
"policy_type": "velocity",
"weights_scale": 50,
}
)
register(
id='ViaPointReacherDMP-v0',
2021-04-21 10:45:34 +02:00
entry_point='alr_envs.utils.make_env_helpers:make_dmp_env',
# max_episode_steps=1,
2021-04-21 10:45:34 +02:00
kwargs={
"name": "alr_envs:ViaPointReacher-v0",
"num_dof": 5,
"num_basis": 5,
"duration": 2,
"alpha_phase": 2,
"learn_goal": False,
"policy_type": "velocity",
"weights_scale": 50,
}
)
register(
id='HoleReacherDMP-v0',
2021-04-21 10:45:34 +02:00
entry_point='alr_envs.utils.make_env_helpers:make_dmp_env',
# max_episode_steps=1,
2021-04-21 10:45:34 +02:00
kwargs={
"name": "alr_envs:HoleReacher-v0",
"num_dof": 5,
"num_basis": 5,
"duration": 2,
"learn_goal": True,
"alpha_phase": 2,
"bandwidth_factor": 2,
"policy_type": "velocity",
"weights_scale": 50,
"goal_scale": 0.1
}
)
2021-05-07 09:51:53 +02:00
register(
id='HoleReacherDMP-v2',
entry_point='alr_envs.utils.make_env_helpers:make_dmp_env',
# max_episode_steps=1,
kwargs={
"name": "alr_envs:HoleReacher-v2",
"num_dof": 5,
"num_basis": 5,
"duration": 2,
"learn_goal": True,
"alpha_phase": 2,
"bandwidth_factor": 2,
"policy_type": "velocity",
"weights_scale": 50,
"goal_scale": 0.1
}
)
2021-04-21 10:45:34 +02:00
# TODO: properly add final_pos
register(
id='HoleReacherFixedGoalDMP-v0',
2021-04-21 10:45:34 +02:00
entry_point='alr_envs.utils.make_env_helpers:make_dmp_env',
# max_episode_steps=1,
2021-04-21 10:45:34 +02:00
kwargs={
"name": "alr_envs:HoleReacher-v0",
"num_dof": 5,
"num_basis": 5,
"duration": 2,
"learn_goal": False,
"alpha_phase": 2,
"policy_type": "velocity",
"weights_scale": 50,
"goal_scale": 0.1
}
)
2021-04-23 11:37:42 +02:00
# register(
# id='HoleReacherDetPMP-v0',
# entry_point='alr_envs.classic_control.hole_reacher:holereacher_detpmp',
# # max_episode_steps=1,
# # TODO: add mp kwargs
# )
register(
2021-04-23 11:37:42 +02:00
id='ALRBallInACupSimpleDMP-v0',
entry_point='alr_envs.utils.make_env_helpers:make_dmp_env',
kwargs={
2021-04-23 12:47:55 +02:00
"name": "alr_envs:ALRBallInACupSimple-v0",
2021-04-23 11:37:42 +02:00
"num_dof": 3,
"num_basis": 5,
"duration": 3.5,
"post_traj_time": 4.5,
"learn_goal": False,
"alpha_phase": 3,
"bandwidth_factor": 2.5,
"policy_type": "motor",
"weights_scale": 100,
"return_to_start": True
}
2021-04-21 10:45:34 +02:00
)
2021-04-23 12:16:19 +02:00
register(
id='ALRBallInACupDMP-v0',
entry_point='alr_envs.utils.make_env_helpers:make_dmp_env',
kwargs={
"name": "alr_envs:ALRBallInACup-v0",
"num_dof": 7,
"num_basis": 5,
"duration": 3.5,
"post_traj_time": 4.5,
"learn_goal": False,
"alpha_phase": 3,
"bandwidth_factor": 2.5,
"policy_type": "motor",
"weights_scale": 100,
"return_to_start": True
}
)
2021-04-21 10:45:34 +02:00
register(
2021-04-23 11:37:42 +02:00
id='ALRBallInACupGoalDMP-v0',
2021-04-23 12:47:55 +02:00
entry_point='alr_envs.utils.make_env_helpers:make_contextual_env',
2021-04-21 10:45:34 +02:00
kwargs={
2021-04-23 11:37:42 +02:00
"name": "alr_envs:ALRBallInACupGoal-v0",
2021-04-23 12:16:19 +02:00
"num_dof": 7,
2021-04-21 10:45:34 +02:00
"num_basis": 5,
2021-04-23 12:16:19 +02:00
"duration": 3.5,
"post_traj_time": 4.5,
2021-04-21 10:45:34 +02:00
"learn_goal": True,
2021-04-23 12:16:19 +02:00
"alpha_phase": 3,
"bandwidth_factor": 2.5,
"policy_type": "motor",
2021-04-21 10:45:34 +02:00
"weights_scale": 50,
"goal_scale": 0.1
}
)
# BBO functions
2020-11-03 11:26:06 +01:00
for dim in [5, 10, 25, 50, 100]:
register(
id=f'Rosenbrock{dim}-v0',
entry_point='alr_envs.stochastic_search:StochasticSearchEnv',
max_episode_steps=1,
kwargs={
"cost_f": Rosenbrock(dim),
2020-11-03 11:26:06 +01:00
}
)