Use LunarLanderContinuous-v2 as the new default test environment
This commit is contained in:
parent
cf5a2e82fc
commit
60c954c8c1
10
test.py
10
test.py
@ -17,7 +17,7 @@ import columbus
|
|||||||
root_path = '.'
|
root_path = '.'
|
||||||
|
|
||||||
|
|
||||||
def main(env_name='ColumbusCandyland_Aux10-v0', timesteps=5000, showRes=False, saveModel=True, n_eval_episodes=8):
|
def main(env_name='ColumbusCandyland_Aux10-v0', timesteps=50000, showRes=False, saveModel=True, n_eval_episodes=16):
|
||||||
env = gym.make(env_name)
|
env = gym.make(env_name)
|
||||||
test_sde = False
|
test_sde = False
|
||||||
ppo = PPO(
|
ppo = PPO(
|
||||||
@ -87,12 +87,12 @@ def main(env_name='ColumbusCandyland_Aux10-v0', timesteps=5000, showRes=False, s
|
|||||||
# learning_rate=0.001 # 0.015
|
# learning_rate=0.001 # 0.015
|
||||||
# )
|
# )
|
||||||
|
|
||||||
print('PPO:')
|
|
||||||
testModel(ppo, timesteps, showRes,
|
|
||||||
saveModel, n_eval_episodes)
|
|
||||||
print('TRL_PG:')
|
print('TRL_PG:')
|
||||||
testModel(trl_pg, timesteps, showRes,
|
testModel(trl_pg, timesteps, showRes,
|
||||||
saveModel, n_eval_episodes)
|
saveModel, n_eval_episodes)
|
||||||
|
print('PPO:')
|
||||||
|
testModel(ppo, timesteps, showRes,
|
||||||
|
saveModel, n_eval_episodes)
|
||||||
|
|
||||||
|
|
||||||
def testModel(model, timesteps, showRes=False, saveModel=False, n_eval_episodes=16):
|
def testModel(model, timesteps, showRes=False, saveModel=False, n_eval_episodes=16):
|
||||||
@ -131,4 +131,4 @@ def testModel(model, timesteps, showRes=False, saveModel=False, n_eval_episodes=
|
|||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
main('CartPole-v1')
|
main('LunarLanderContinuous-v2')
|
||||||
|
Loading…
Reference in New Issue
Block a user