Implemented Rectangles (no Raycasting yet...)
This commit is contained in:
parent
908685b2f5
commit
c34d266ea5
@ -4,14 +4,13 @@ import math
|
|||||||
|
|
||||||
class Entity(object):
|
class Entity(object):
|
||||||
def __init__(self, env):
|
def __init__(self, env):
|
||||||
|
self.shape = None
|
||||||
self.env = env
|
self.env = env
|
||||||
self.pos = (env.random(), env.random())
|
self.pos = (env.random(), env.random())
|
||||||
self.speed = (0, 0)
|
self.speed = (0, 0)
|
||||||
self.acc = (0, 0)
|
self.acc = (0, 0)
|
||||||
self.drag = 0
|
self.drag = 0
|
||||||
self.radius = 10
|
|
||||||
self.col = (255, 255, 255)
|
self.col = (255, 255, 255)
|
||||||
self.shape = 'circle'
|
|
||||||
self.solid = False
|
self.solid = False
|
||||||
self.movable = False # False = Non movable, True = Movable, x>1: lighter movable
|
self.movable = False # False = Non movable, True = Movable, x>1: lighter movable
|
||||||
self.elasticity = 1
|
self.elasticity = 1
|
||||||
@ -48,9 +47,8 @@ class Entity(object):
|
|||||||
self._crash_list = []
|
self._crash_list = []
|
||||||
|
|
||||||
def draw(self):
|
def draw(self):
|
||||||
x, y = self.pos
|
raise Exception(
|
||||||
pygame.draw.circle(self.env.surface, self.col,
|
'[!] draw not implemented for shape "'+str(self.shape)+'"')
|
||||||
(x*self.env.width, y*self.env.height), self.radius, width=0)
|
|
||||||
|
|
||||||
def on_collision(self, other, depth):
|
def on_collision(self, other, depth):
|
||||||
if self.solid and other.solid:
|
if self.solid and other.solid:
|
||||||
@ -61,7 +59,8 @@ class Entity(object):
|
|||||||
if other in self._crash_list:
|
if other in self._crash_list:
|
||||||
return
|
return
|
||||||
self._crash_list.append(other)
|
self._crash_list.append(other)
|
||||||
force_dir = self.pos[0] - other.pos[0], self.pos[1] - other.pos[1]
|
force_dir = self._get_crash_force_dir(other)
|
||||||
|
print(force_dir, depth)
|
||||||
force_dir_len = math.sqrt(force_dir[0]**2+force_dir[1]**2)
|
force_dir_len = math.sqrt(force_dir[0]**2+force_dir[1]**2)
|
||||||
if force_dir_len == 0:
|
if force_dir_len == 0:
|
||||||
return
|
return
|
||||||
@ -82,9 +81,19 @@ class Entity(object):
|
|||||||
self.env.speed_fac, self.pos[1] - self.env.inp[1] * \
|
self.env.speed_fac, self.pos[1] - self.env.inp[1] * \
|
||||||
self._coll_add_pushback*self.env.speed_fac
|
self._coll_add_pushback*self.env.speed_fac
|
||||||
if self.collision_changes_speed:
|
if self.collision_changes_speed:
|
||||||
|
oldspeed = math.sqrt(self.speed[0]**2+self.speed[1]**2)
|
||||||
self.speed = self.speed[0] + \
|
self.speed = self.speed[0] + \
|
||||||
force_vec[0]*self.collision_elasticity/self.env.speed_fac, self.speed[1] + \
|
force_vec[0]*self.collision_elasticity/self.env.speed_fac, self.speed[1] + \
|
||||||
force_vec[1]*self.collision_elasticity/self.env.speed_fac
|
force_vec[1]*self.collision_elasticity/self.env.speed_fac
|
||||||
|
newspeed = math.sqrt(self.speed[0]**2+self.speed[1]**2)
|
||||||
|
if newspeed > oldspeed*1.1:
|
||||||
|
self.speed = self.speed[0]/newspeed*1.1 * \
|
||||||
|
oldspeed, self.speed[1]/newspeed*oldspeed*1.1
|
||||||
|
|
||||||
|
def _get_crash_force_dir(self, other):
|
||||||
|
if 1 == 1: # linter hack
|
||||||
|
raise Exception(
|
||||||
|
'[!] No collision-logic implemented for shape"'+str(self.shape)+'"')
|
||||||
|
|
||||||
def on_collect(self, other):
|
def on_collect(self, other):
|
||||||
pass
|
pass
|
||||||
@ -105,7 +114,94 @@ class Entity(object):
|
|||||||
self.env.kill_entity(self)
|
self.env.kill_entity(self)
|
||||||
|
|
||||||
|
|
||||||
class Agent(Entity):
|
class CircularEntity(Entity):
|
||||||
|
def __init__(self, env):
|
||||||
|
super().__init__(env)
|
||||||
|
self.shape = 'circle'
|
||||||
|
self.radius = 10
|
||||||
|
|
||||||
|
def draw(self):
|
||||||
|
x, y = self.pos
|
||||||
|
pygame.draw.circle(self.env.surface, self.col,
|
||||||
|
(x*self.env.width, y*self.env.height), self.radius, width=0)
|
||||||
|
|
||||||
|
def _get_crash_force_dir(self, other):
|
||||||
|
if other.shape == 'circle':
|
||||||
|
return self.pos[0] - other.pos[0], self.pos[1] - other.pos[1]
|
||||||
|
elif other.shape == 'rect':
|
||||||
|
pad = 0
|
||||||
|
edge_size = min(self.radius, min(
|
||||||
|
other.width/3, other.height/3)) + 1
|
||||||
|
|
||||||
|
x, y = self.pos
|
||||||
|
x, y = x*self.env.height, y*self.env.width
|
||||||
|
left, top = x - self.radius + pad, y - self.radius + pad
|
||||||
|
right, bottom = x + self.radius - pad, y + self.radius - pad
|
||||||
|
lrcenter, tbcenter = x, y
|
||||||
|
|
||||||
|
ox, oy = other.pos
|
||||||
|
ox, oy = ox*self.env.height, oy*self.env.width
|
||||||
|
oleft, otop = ox + pad, oy + pad
|
||||||
|
oright, obottom = ox + other.width - pad, oy + other.height - pad
|
||||||
|
olrcenter, otbcenter = ox + other.width/2, oy + other.height/2
|
||||||
|
|
||||||
|
lr, tb = 0, 0
|
||||||
|
|
||||||
|
if otop < bottom and obottom > bottom:
|
||||||
|
# col from top
|
||||||
|
tb = otop - bottom
|
||||||
|
#print('t', tb)
|
||||||
|
elif top < obottom and top > otop:
|
||||||
|
# col from bottom
|
||||||
|
tb = - top + obottom
|
||||||
|
#print('b', tb)
|
||||||
|
|
||||||
|
if right > oleft and right < oright:
|
||||||
|
# col from left
|
||||||
|
lr = oleft - right
|
||||||
|
#print('l', lr)
|
||||||
|
elif left < oright and left > oleft:
|
||||||
|
# col from right
|
||||||
|
lr = - left + oright
|
||||||
|
#print('r', lr)
|
||||||
|
|
||||||
|
if lr != 0 and tb != 0:
|
||||||
|
if abs(abs(tb) - abs(lr)) < edge_size:
|
||||||
|
if abs(tb) < abs(lr):
|
||||||
|
return lr/5, tb
|
||||||
|
else:
|
||||||
|
return lr, tb/5
|
||||||
|
if abs(tb) < abs(lr):
|
||||||
|
return 0, tb
|
||||||
|
else:
|
||||||
|
return lr, 0
|
||||||
|
|
||||||
|
return 0, 0
|
||||||
|
else:
|
||||||
|
raise Exception(
|
||||||
|
'[!] Shape "circle" does not know how to collide with shape "'+str(other.shape)+'"')
|
||||||
|
|
||||||
|
|
||||||
|
class RectangularEntity(Entity):
|
||||||
|
def __init__(self, env):
|
||||||
|
super().__init__(env)
|
||||||
|
self.shape = 'rect'
|
||||||
|
self.width = 10
|
||||||
|
self.height = 10
|
||||||
|
|
||||||
|
def draw(self):
|
||||||
|
x, y = self.pos
|
||||||
|
rect = pygame.Rect(x*self.env.width, y *
|
||||||
|
self.env.width, self.width, self.height)
|
||||||
|
pygame.draw.rect(self.env.surface, self.col,
|
||||||
|
rect, width=0)
|
||||||
|
|
||||||
|
def _get_crash_force_dir(self, other):
|
||||||
|
raise Exception(
|
||||||
|
'[!] Collisions in this direction not implemented for shape "rectangle"')
|
||||||
|
|
||||||
|
|
||||||
|
class Agent(CircularEntity):
|
||||||
def __init__(self, env):
|
def __init__(self, env):
|
||||||
super(Agent, self).__init__(env)
|
super(Agent, self).__init__(env)
|
||||||
self.pos = (0.5, 0.5)
|
self.pos = (0.5, 0.5)
|
||||||
@ -148,12 +244,17 @@ class Barrier(Enemy):
|
|||||||
self.movable = False
|
self.movable = False
|
||||||
|
|
||||||
|
|
||||||
class CircleBarrier(Barrier):
|
class CircleBarrier(Barrier, CircularEntity):
|
||||||
def __init__(self, env):
|
def __init__(self, env):
|
||||||
super(CircleBarrier, self).__init__(env)
|
super(CircleBarrier, self).__init__(env)
|
||||||
|
|
||||||
|
|
||||||
class Chaser(Enemy):
|
class RectBarrier(Barrier, RectangularEntity):
|
||||||
|
def __init__(self, env):
|
||||||
|
super().__init__(env)
|
||||||
|
|
||||||
|
|
||||||
|
class Chaser(Enemy, CircularEntity):
|
||||||
def __init__(self, env):
|
def __init__(self, env):
|
||||||
super(Chaser, self).__init__(env)
|
super(Chaser, self).__init__(env)
|
||||||
self.target = self.env.agent
|
self.target = self.env.agent
|
||||||
@ -193,7 +294,7 @@ class FlyingChaser(Chaser):
|
|||||||
self.acc = arrow[0] * self.chase_acc, arrow[1] * self.chase_acc
|
self.acc = arrow[0] * self.chase_acc, arrow[1] * self.chase_acc
|
||||||
|
|
||||||
|
|
||||||
class Collectable(Entity):
|
class Collectable(CircularEntity):
|
||||||
def __init__(self, env):
|
def __init__(self, env):
|
||||||
super(Collectable, self).__init__(env)
|
super(Collectable, self).__init__(env)
|
||||||
self.avaible = True
|
self.avaible = True
|
||||||
@ -271,7 +372,7 @@ class TimeoutReward(OnceReward):
|
|||||||
self.env.timers.append((self.timeout, self.set_avaible, True))
|
self.env.timers.append((self.timeout, self.set_avaible, True))
|
||||||
|
|
||||||
|
|
||||||
class Ball(Entity):
|
class Ball(CircularEntity):
|
||||||
def __init__(self, env):
|
def __init__(self, env):
|
||||||
super(Ball, self).__init__(env)
|
super(Ball, self).__init__(env)
|
||||||
self.col = (255, 128, 0)
|
self.col = (255, 128, 0)
|
||||||
|
243
columbus/env.py
243
columbus/env.py
@ -45,7 +45,7 @@ def parseObs(obsConf):
|
|||||||
class ColumbusEnv(gym.Env):
|
class ColumbusEnv(gym.Env):
|
||||||
metadata = {'render.modes': ['human']}
|
metadata = {'render.modes': ['human']}
|
||||||
|
|
||||||
def __init__(self, observable=observables.Observable(), fps=60, env_seed=3.1, master_seed=None, start_pos=(0.5, 0.5), start_score=0, speed_fac=0.01, acc_fac=0.02, die_on_zero=False, return_on_score=-1, reward_mult=1, agent_drag=0, controll_type='SPEED', aux_reward_max=1, aux_penalty_max=0, aux_reward_discretize=0, void_is_type_barrier=True, void_damage=1, torus_topology=False, default_collision_elasticity=1):
|
def __init__(self, observable=observables.Observable(), fps=60, env_seed=3.1, master_seed=None, start_pos=(0.5, 0.5), start_score=0, speed_fac=0.01, acc_fac=0.04, die_on_zero=False, return_on_score=-1, reward_mult=1, agent_drag=0, controll_type='SPEED', aux_reward_max=1, aux_penalty_max=0, aux_reward_discretize=0, void_is_type_barrier=True, void_damage=1, torus_topology=False, default_collision_elasticity=1):
|
||||||
super(ColumbusEnv, self).__init__()
|
super(ColumbusEnv, self).__init__()
|
||||||
self.action_space = spaces.Box(
|
self.action_space = spaces.Box(
|
||||||
low=-1, high=1, shape=(2,), dtype=np.float32)
|
low=-1, high=1, shape=(2,), dtype=np.float32)
|
||||||
@ -79,6 +79,7 @@ class ColumbusEnv(gym.Env):
|
|||||||
self.aux_reward_discretize = aux_reward_discretize
|
self.aux_reward_discretize = aux_reward_discretize
|
||||||
# 0 = dont discretize; how many steps (along diagonal)
|
# 0 = dont discretize; how many steps (along diagonal)
|
||||||
self.aux_reward_discretize = 0
|
self.aux_reward_discretize = 0
|
||||||
|
self.penalty_from_edges = False
|
||||||
self.draw_observable = True
|
self.draw_observable = True
|
||||||
self.draw_joystick = True
|
self.draw_joystick = True
|
||||||
self.draw_entities = True
|
self.draw_entities = True
|
||||||
@ -169,6 +170,11 @@ class ColumbusEnv(gym.Env):
|
|||||||
aux_reward += reward
|
aux_reward += reward
|
||||||
elif isinstance(entity, entities.Enemy):
|
elif isinstance(entity, entities.Enemy):
|
||||||
if entity.radiateDamage:
|
if entity.radiateDamage:
|
||||||
|
if self.penalty_from_edges:
|
||||||
|
penalty = self.aux_penalty_max / \
|
||||||
|
(1 + self.sq_dist(entity.pos,
|
||||||
|
self.agent.pos) - entity.radius - self.agent.redius)
|
||||||
|
else:
|
||||||
penalty = self.aux_penalty_max / \
|
penalty = self.aux_penalty_max / \
|
||||||
(1 + self.sq_dist(entity.pos, self.agent.pos))
|
(1 + self.sq_dist(entity.pos, self.agent.pos))
|
||||||
|
|
||||||
@ -220,12 +226,16 @@ class ColumbusEnv(gym.Env):
|
|||||||
other.on_collision(entity, depth)
|
other.on_collision(entity, depth)
|
||||||
|
|
||||||
def _check_collision_between(self, e1, e2):
|
def _check_collision_between(self, e1, e2):
|
||||||
|
e = [e1, e2]
|
||||||
|
e.sort(key=lambda x: x.shape)
|
||||||
|
e1, e2 = e
|
||||||
shapes = [e1.shape, e2.shape]
|
shapes = [e1.shape, e2.shape]
|
||||||
shapes.sort()
|
|
||||||
if shapes == ['circle', 'circle']:
|
if shapes == ['circle', 'circle']:
|
||||||
dist = math.sqrt(((e1.pos[0]-e2.pos[0])*self.width) ** 2
|
dist = math.sqrt(((e1.pos[0]-e2.pos[0])*self.width) ** 2
|
||||||
+ ((e1.pos[1]-e2.pos[1])*self.height)**2)
|
+ ((e1.pos[1]-e2.pos[1])*self.height)**2)
|
||||||
return max(0, e1.radius + e2.radius - dist)
|
return max(0, e1.radius + e2.radius - dist)
|
||||||
|
elif shapes == ['circle', 'rect']:
|
||||||
|
return sum([abs(d) for d in e1._get_crash_force_dir(e2)])
|
||||||
else:
|
else:
|
||||||
raise Exception(
|
raise Exception(
|
||||||
'Checking for collision between unsupported shapes: '+str(shapes))
|
'Checking for collision between unsupported shapes: '+str(shapes))
|
||||||
@ -406,6 +416,29 @@ class ColumbusTest3_1(ColumbusEnv):
|
|||||||
self.entities.append(reward)
|
self.entities.append(reward)
|
||||||
|
|
||||||
|
|
||||||
|
class ColumbusTestRect(ColumbusEnv):
|
||||||
|
def __init__(self, observable=observables.Observable(), fps=30, aux_reward_max=1, **kw):
|
||||||
|
super().__init__(
|
||||||
|
observable=observable, fps=fps, env_seed=3.3, aux_reward_max=aux_reward_max, controll_type='ACC', **kw)
|
||||||
|
self.start_pos = [0.5, 0.5]
|
||||||
|
self.score = 0
|
||||||
|
|
||||||
|
def setup(self):
|
||||||
|
self.agent.pos = self.start_pos
|
||||||
|
for i in range(1):
|
||||||
|
enemy = entities.RectBarrier(self)
|
||||||
|
enemy.width = self.random()*40+50
|
||||||
|
enemy.height = self.random()*40+50
|
||||||
|
self.entities.append(enemy)
|
||||||
|
for i in range(1):
|
||||||
|
enemy = entities.CircleBarrier(self)
|
||||||
|
enemy.radius = self.random()*40+50
|
||||||
|
self.entities.append(enemy)
|
||||||
|
for i in range(1):
|
||||||
|
reward = entities.TeleportingReward(self)
|
||||||
|
self.entities.append(reward)
|
||||||
|
|
||||||
|
|
||||||
class ColumbusTestRay(ColumbusTest3_1):
|
class ColumbusTestRay(ColumbusTest3_1):
|
||||||
def __init__(self, observable=observables.RayObservable(), hide_map=False, fps=30, **kw):
|
def __init__(self, observable=observables.RayObservable(), hide_map=False, fps=30, **kw):
|
||||||
super(ColumbusTestRay, self).__init__(
|
super(ColumbusTestRay, self).__init__(
|
||||||
@ -421,6 +454,74 @@ class ColumbusRayDrone(ColumbusTestRay):
|
|||||||
self.agent_drag = 0.02
|
self.agent_drag = 0.02
|
||||||
|
|
||||||
|
|
||||||
|
class ColumbusDemoEnv3_1(ColumbusEnv):
|
||||||
|
def __init__(self, observable=observables.Observable(), fps=30, aux_reward_max=1, **kw):
|
||||||
|
super().__init__(
|
||||||
|
observable=observable, fps=fps, env_seed=3.1, aux_reward_max=aux_reward_max, controll_type='ACC', agent_drag=0.05, **kw)
|
||||||
|
self.start_pos = [0.6, 0.3]
|
||||||
|
self.score = 0
|
||||||
|
|
||||||
|
def setup(self):
|
||||||
|
self.agent.pos = self.start_pos
|
||||||
|
for i in range(18):
|
||||||
|
enemy = entities.CircleBarrier(self)
|
||||||
|
enemy.radius = self.random()*40+50
|
||||||
|
self.entities.append(enemy)
|
||||||
|
for i in range(0):
|
||||||
|
enemy = entities.FlyingChaser(self)
|
||||||
|
enemy.chase_acc = self.random()*0.4*0.3 # *0.6+0.5
|
||||||
|
self.entities.append(enemy)
|
||||||
|
for i in range(1):
|
||||||
|
reward = entities.TeleportingReward(self)
|
||||||
|
self.entities.append(reward)
|
||||||
|
|
||||||
|
|
||||||
|
class ColumbusDemoEnv2_7(ColumbusEnv):
|
||||||
|
def __init__(self, observable=observables.Observable(), fps=30, aux_reward_max=1, **kw):
|
||||||
|
super().__init__(
|
||||||
|
observable=observable, fps=fps, env_seed=2.7, aux_reward_max=aux_reward_max, controll_type='ACC', agent_drag=0.05, **kw)
|
||||||
|
self.start_pos = [0.6, 0.3]
|
||||||
|
self.score = 0
|
||||||
|
|
||||||
|
def setup(self):
|
||||||
|
self.agent.pos = self.start_pos
|
||||||
|
for i in range(12):
|
||||||
|
enemy = entities.CircleBarrier(self)
|
||||||
|
enemy.radius = self.random()*30+40
|
||||||
|
self.entities.append(enemy)
|
||||||
|
for i in range(3):
|
||||||
|
enemy = entities.FlyingChaser(self)
|
||||||
|
enemy.chase_acc = self.random()*0.4*0.3 # *0.6+0.5
|
||||||
|
self.entities.append(enemy)
|
||||||
|
for i in range(1):
|
||||||
|
reward = entities.TeleportingReward(self)
|
||||||
|
self.entities.append(reward)
|
||||||
|
|
||||||
|
|
||||||
|
class ColumbusDemoEnvFootball(ColumbusEnv):
|
||||||
|
def __init__(self, observable=observables.Observable(), fps=30, walkingOpponent=0, flyingOpponent=0, **kw):
|
||||||
|
super().__init__(
|
||||||
|
observable=observable, fps=fps, env_seed=1.23, **kw)
|
||||||
|
self.start_pos = [0.5, 0.5]
|
||||||
|
self.score = 0
|
||||||
|
self.walkingOpponents = walkingOpponent
|
||||||
|
self.flyingOpponents = flyingOpponent
|
||||||
|
|
||||||
|
def setup(self):
|
||||||
|
self.agent.pos = self.start_pos
|
||||||
|
for i in range(8):
|
||||||
|
enemy = entities.CircleBarrier(self)
|
||||||
|
enemy.radius = self.random()*40+50
|
||||||
|
self.entities.append(enemy)
|
||||||
|
ball = entities.Ball(self)
|
||||||
|
self.entities.append(ball)
|
||||||
|
self.entities.append(entities.TeleportingGoal(self))
|
||||||
|
for i in range(self.walkingOpponents):
|
||||||
|
self.entities.append(entities.WalkingFootballPlayer(self, ball))
|
||||||
|
for i in range(self.flyingOpponents):
|
||||||
|
self.entities.append(entities.FlyingFootballPlayer(self, ball))
|
||||||
|
|
||||||
|
|
||||||
class ColumbusCandyland(ColumbusEnv):
|
class ColumbusCandyland(ColumbusEnv):
|
||||||
def __init__(self, observable=observables.RayObservable(chans=[entities.Reward, entities.Void], num_rays=16, include_rand=True), hide_map=False, fps=30, env_seed=None, **kw):
|
def __init__(self, observable=observables.RayObservable(chans=[entities.Reward, entities.Void], num_rays=16, include_rand=True), hide_map=False, fps=30, env_seed=None, **kw):
|
||||||
super(ColumbusCandyland, self).__init__(
|
super(ColumbusCandyland, self).__init__(
|
||||||
@ -664,7 +765,7 @@ class ColumbusConfigDefined(ColumbusEnv):
|
|||||||
|
|
||||||
|
|
||||||
class ColumbusBlub(ColumbusEnv):
|
class ColumbusBlub(ColumbusEnv):
|
||||||
def __init__(self, observable=observables.Observable(), env_seed=None, entities=[], fps=30, **kw):
|
def __init__(self, observable=observables.CompositionalObservable([observables.StateObservable(), observables.RayObservable(num_rays=6, chans=[entities.Enemy])]), env_seed=None, entities=[], fps=30, **kw):
|
||||||
super().__init__(
|
super().__init__(
|
||||||
observable=observable, fps=fps, env_seed=env_seed, default_collision_elasticity=0.8, speed_fac=0.01, acc_fac=0.1, agent_drag=0.06, controll_type='ACC')
|
observable=observable, fps=fps, env_seed=env_seed, default_collision_elasticity=0.8, speed_fac=0.01, acc_fac=0.1, agent_drag=0.06, controll_type='ACC')
|
||||||
|
|
||||||
@ -682,11 +783,11 @@ class ColumbusBlub(ColumbusEnv):
|
|||||||
|
|
||||||
|
|
||||||
###
|
###
|
||||||
register(
|
# register(
|
||||||
id='ColumbusBlub-v0',
|
# id='ColumbusBlub-v0',
|
||||||
entry_point=ColumbusBlub,
|
# entry_point=ColumbusBlub,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
|
|
||||||
register(
|
register(
|
||||||
@ -701,41 +802,41 @@ register(
|
|||||||
max_episode_steps=30*60*2,
|
max_episode_steps=30*60*2,
|
||||||
)
|
)
|
||||||
|
|
||||||
register(
|
# register(
|
||||||
id='ColumbusRayDrone-v0',
|
# id='ColumbusRayDrone-v0',
|
||||||
entry_point=ColumbusRayDrone,
|
# entry_point=ColumbusRayDrone,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
register(
|
# register(
|
||||||
id='ColumbusCandyland-v0',
|
# id='ColumbusCandyland-v0',
|
||||||
entry_point=ColumbusCandyland,
|
# entry_point=ColumbusCandyland,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
register(
|
# register(
|
||||||
id='ColumbusCandyland_Aux10-v0',
|
# id='ColumbusCandyland_Aux10-v0',
|
||||||
entry_point=ColumbusCandyland_Aux10,
|
# entry_point=ColumbusCandyland_Aux10,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
register(
|
# register(
|
||||||
id='ColumbusEasyObstacles-v0',
|
# id='ColumbusEasyObstacles-v0',
|
||||||
entry_point=ColumbusEasyObstacles,
|
# entry_point=ColumbusEasyObstacles,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
register(
|
# register(
|
||||||
id='ColumbusEasierObstacles-v0',
|
# id='ColumbusEasierObstacles-v0',
|
||||||
entry_point=ColumbusEasyObstacles,
|
# entry_point=ColumbusEasyObstacles,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
register(
|
# register(
|
||||||
id='ColumbusJustState-v0',
|
# id='ColumbusJustState-v0',
|
||||||
entry_point=ColumbusJustState,
|
# entry_point=ColumbusJustState,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
register(
|
register(
|
||||||
id='ColumbusStateWithBarriers-v0',
|
id='ColumbusStateWithBarriers-v0',
|
||||||
@ -743,38 +844,54 @@ register(
|
|||||||
max_episode_steps=30*60*2,
|
max_episode_steps=30*60*2,
|
||||||
)
|
)
|
||||||
|
|
||||||
register(
|
# register(
|
||||||
id='ColumbusCompassWithBarriers-v0',
|
# id='ColumbusCompassWithBarriers-v0',
|
||||||
entry_point=ColumbusCompassWithBarriers,
|
# entry_point=ColumbusCompassWithBarriers,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
register(
|
# register(
|
||||||
id='ColumbusTrivialRay-v0',
|
# id='ColumbusTrivialRay-v0',
|
||||||
entry_point=ColumbusTrivialRay,
|
# entry_point=ColumbusTrivialRay,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
register(
|
# register(
|
||||||
id='ColumbusFootball-v0',
|
# id='ColumbusFootball-v0',
|
||||||
entry_point=ColumbusFootball,
|
# entry_point=ColumbusFootball,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
register(
|
# register(
|
||||||
id='ColumbusComb-v0',
|
# id='ColumbusComb-v0',
|
||||||
entry_point=ColumbusComp,
|
# entry_point=ColumbusComp,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
register(
|
# register(
|
||||||
id='ColumbusSingle-v0',
|
# id='ColumbusSingle-v0',
|
||||||
entry_point=ColumbusSingle,
|
# entry_point=ColumbusSingle,
|
||||||
max_episode_steps=30*60*2,
|
# max_episode_steps=30*60*2,
|
||||||
)
|
# )
|
||||||
|
|
||||||
register(
|
register(
|
||||||
id='ColumbusConfigDefined-v0',
|
id='ColumbusConfigDefined-v0',
|
||||||
entry_point=ColumbusConfigDefined,
|
entry_point=ColumbusConfigDefined,
|
||||||
max_episode_steps=30*60*2,
|
max_episode_steps=30*60*2,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
register(
|
||||||
|
id='ColumbusDemoEnvFootball-v0',
|
||||||
|
entry_point=ColumbusDemoEnvFootball,
|
||||||
|
max_episode_steps=30*60*2,
|
||||||
|
)
|
||||||
|
register(
|
||||||
|
id='ColumbusDemoEnv3_1-v0',
|
||||||
|
entry_point=ColumbusDemoEnv3_1,
|
||||||
|
max_episode_steps=30*60*2,
|
||||||
|
)
|
||||||
|
register(
|
||||||
|
id='ColumbusDemoEnv2_7-v0',
|
||||||
|
entry_point=ColumbusDemoEnv2_7,
|
||||||
|
max_episode_steps=30*60*2,
|
||||||
|
)
|
||||||
|
@ -48,7 +48,7 @@ class CnnObservable(Observable):
|
|||||||
|
|
||||||
def get_observation(self):
|
def get_observation(self):
|
||||||
if not self.env._rendered:
|
if not self.env._rendered:
|
||||||
self.env.render(dont_show=True)
|
self.env.render(mode='internal', dont_show=False)
|
||||||
self.env._ensure_surface()
|
self.env._ensure_surface()
|
||||||
x, y = self.env.agent.pos[0]*self.env.width - self.in_width / \
|
x, y = self.env.agent.pos[0]*self.env.width - self.in_width / \
|
||||||
2, self.env.agent.pos[1]*self.env.height - self.in_height/2
|
2, self.env.agent.pos[1]*self.env.height - self.in_height/2
|
||||||
|
Loading…
Reference in New Issue
Block a user