From 17c489d62242030c3814364c791392b4f29943ab Mon Sep 17 00:00:00 2001 From: ottofabian Date: Wed, 19 May 2021 18:02:34 +0200 Subject: [PATCH] fixed incorrect sampling in hole reacher --- alr_envs/classic_control/hole_reacher.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/alr_envs/classic_control/hole_reacher.py b/alr_envs/classic_control/hole_reacher.py index 064b94b..a4f1f33 100644 --- a/alr_envs/classic_control/hole_reacher.py +++ b/alr_envs/classic_control/hole_reacher.py @@ -105,8 +105,8 @@ class HoleReacherEnv(MPEnv): return self._get_obs().copy() def _generate_hole(self): - self._tmp_hole_x = self.np_random.uniform(0.5, 3.5, 1) if self._hole_x is None else np.copy(self._hole_x) - self._tmp_hole_width = self.np_random.uniform(0.5, 0.1, 1) if self._hole_width is None else np.copy( + self._tmp_hole_x = self.np_random.uniform(1, 3.5, 1) if self._hole_x is None else np.copy(self._hole_x) + self._tmp_hole_width = self.np_random.uniform(0.15, 0.5, 1) if self._hole_width is None else np.copy( self._hole_width) # TODO we do not want this right now. self._tmp_hole_depth = self.np_random.uniform(1, 1, 1) if self._hole_depth is None else np.copy( @@ -310,12 +310,13 @@ if __name__ == '__main__': hole_depth=1, hole_x=None) obs = env.reset() - for i in range(200): + for i in range(2000): # objective.load_result("/tmp/cma") # test with random actions ac = 2 * env.action_space.sample() obs, rew, d, info = env.step(ac) - env.render(mode=render_mode) + if i % 10 == 0: + env.render(mode=render_mode) print(rew)