From 78edfb8da790c450dc2dd65018fbcead8f22bdc1 Mon Sep 17 00:00:00 2001
From: Onur <celik@kit.edu>
Date: Thu, 7 Jul 2022 10:55:36 +0200
Subject: [PATCH] fix hopper jump reward bug

---
 alr_envs/alr/mujoco/hopper_jump/hopper_jump.py | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/alr_envs/alr/mujoco/hopper_jump/hopper_jump.py b/alr_envs/alr/mujoco/hopper_jump/hopper_jump.py
index f915e9e..74643f3 100644
--- a/alr_envs/alr/mujoco/hopper_jump/hopper_jump.py
+++ b/alr_envs/alr/mujoco/hopper_jump/hopper_jump.py
@@ -90,10 +90,9 @@ class HopperJumpEnv(HopperEnv):
         rewards = 0
         if not self.sparse or (self.sparse and self._steps >= MAX_EPISODE_STEPS_HOPPERJUMP):
             healthy_reward = self.healthy_reward
-            distance_reward = goal_dist * self._dist_weight
+            distance_reward = -goal_dist * self._dist_weight
             height_reward = (self.max_height if self.sparse else self.get_body_com("torso")[2]) * self._height_weight
-            contact_reward = (self.contact_dist or 5) * self._contact_weight
-            # dist_reward = self._forward_reward_weight * (-3 * goal_dist + 10 * self.max_height - 2 * contact_dist)
+            contact_reward = -(self.contact_dist or 5) * self._contact_weight
             rewards = self._forward_reward_weight * (distance_reward + height_reward + contact_reward + healthy_reward)
 
         observation = self._get_obs()