Lowered aux reward (now per second instead of per frame)
This commit is contained in:
		
							parent
							
								
									54adebfe9b
								
							
						
					
					
						commit
						a9b53b6eca
					
				| @ -123,7 +123,7 @@ class ColumbusEnv(gym.Env): | |||||||
|                             self.aux_reward_discretize / 2 |                             self.aux_reward_discretize / 2 | ||||||
| 
 | 
 | ||||||
|                     aux_reward -= penalty |                     aux_reward -= penalty | ||||||
|         return aux_reward |         return aux_reward/self.fps | ||||||
| 
 | 
 | ||||||
|     def step(self, action): |     def step(self, action): | ||||||
|         # TODO: Just make the range consistent... |         # TODO: Just make the range consistent... | ||||||
| @ -381,7 +381,7 @@ class ColumbusCandyland(ColumbusEnv): | |||||||
| class ColumbusCandyland_Aux10(ColumbusCandyland): | class ColumbusCandyland_Aux10(ColumbusCandyland): | ||||||
|     def __init__(self, fps=30): |     def __init__(self, fps=30): | ||||||
|         super(ColumbusCandyland_Aux10, self).__init__(fps=fps) |         super(ColumbusCandyland_Aux10, self).__init__(fps=fps) | ||||||
|         self.aux_reward_max = 10 |         self.aux_reward_max = 1 | ||||||
| 
 | 
 | ||||||
| 
 | 
 | ||||||
| class ColumbusEasyObstacles(ColumbusEnv): | class ColumbusEasyObstacles(ColumbusEnv): | ||||||
| @ -389,7 +389,7 @@ class ColumbusEasyObstacles(ColumbusEnv): | |||||||
|         super(ColumbusEasyObstacles, self).__init__( |         super(ColumbusEasyObstacles, self).__init__( | ||||||
|             observable=observable,  fps=fps, env_seed=env_seed) |             observable=observable,  fps=fps, env_seed=env_seed) | ||||||
|         self.draw_entities = not hide_map |         self.draw_entities = not hide_map | ||||||
|         self.aux_reward_max = 0.1 |         self.aux_reward_max = 1 | ||||||
| 
 | 
 | ||||||
|     def setup(self): |     def setup(self): | ||||||
|         self.agent.pos = self.start_pos |         self.agent.pos = self.start_pos | ||||||
| @ -412,7 +412,7 @@ class ColumbusEasierObstacles(ColumbusEnv): | |||||||
|         super(ColumbusEasierObstacles, self).__init__( |         super(ColumbusEasierObstacles, self).__init__( | ||||||
|             observable=observable,  fps=fps, env_seed=env_seed) |             observable=observable,  fps=fps, env_seed=env_seed) | ||||||
|         self.draw_entities = not hide_map |         self.draw_entities = not hide_map | ||||||
|         self.aux_reward_max = 0.5 |         self.aux_reward_max = 1 | ||||||
| 
 | 
 | ||||||
|     def setup(self): |     def setup(self): | ||||||
|         self.agent.pos = self.start_pos |         self.agent.pos = self.start_pos | ||||||
|  | |||||||
		Loading…
	
		Reference in New Issue
	
	Block a user