Testing Observables
This commit is contained in:
parent
c6a58b15dd
commit
5c39be5ead
10
test.py
10
test.py
@ -24,8 +24,8 @@ def main(env_name='ColumbusCandyland_Aux10-v0', timesteps=1_000_000, showRes=Tru
|
|||||||
ppo = PPO(
|
ppo = PPO(
|
||||||
MlpPolicyPPO,
|
MlpPolicyPPO,
|
||||||
env,
|
env,
|
||||||
projection=KLProjectionLayer(trust_region_coeff=0.01),
|
projection=BaseProjectionLayer(), # KLProjectionLayer(trust_region_coeff=0.01),
|
||||||
policy_kwargs={'dist_kwargs': {'neural_strength': Strength.SCALAR, 'cov_strength': Strength.DIAG, 'parameterization_type':
|
policy_kwargs={'dist_kwargs': {'neural_strength': Strength.NONE, 'cov_strength': Strength.DIAG, 'parameterization_type':
|
||||||
ParametrizationType.NONE, 'enforce_positive_type': EnforcePositiveType.ABS, 'prob_squashing_type': ProbSquashingType.NONE}},
|
ParametrizationType.NONE, 'enforce_positive_type': EnforcePositiveType.ABS, 'prob_squashing_type': ProbSquashingType.NONE}},
|
||||||
verbose=0,
|
verbose=0,
|
||||||
tensorboard_log=root_path+"/logs_tb/" +
|
tensorboard_log=root_path+"/logs_tb/" +
|
||||||
@ -37,7 +37,7 @@ def main(env_name='ColumbusCandyland_Aux10-v0', timesteps=1_000_000, showRes=Tru
|
|||||||
ent_coef=0.1, # 0.1
|
ent_coef=0.1, # 0.1
|
||||||
vf_coef=0.5,
|
vf_coef=0.5,
|
||||||
use_sde=use_sde, # False
|
use_sde=use_sde, # False
|
||||||
clip_range=1 # 0.2,
|
clip_range=0.2 # 1 # 0.2,
|
||||||
)
|
)
|
||||||
# trl_frob = PPO(
|
# trl_frob = PPO(
|
||||||
# MlpPolicy,
|
# MlpPolicy,
|
||||||
@ -145,9 +145,9 @@ def testModel(model, timesteps, showRes=False, saveModel=False, n_eval_episodes=
|
|||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
# main('LunarLanderContinuous-v2')
|
main('LunarLanderContinuous-v2')
|
||||||
# main('ColumbusJustState-v0')
|
# main('ColumbusJustState-v0')
|
||||||
# main('ColumbusStateWithBarriers-v0')
|
# main('ColumbusStateWithBarriers-v0')
|
||||||
# full('ColumbusEasierObstacles-v0')
|
# full('ColumbusEasierObstacles-v0')
|
||||||
main('ColumbusSingle-v0')
|
# main('ColumbusSingle-v0')
|
||||||
# full('LunarLanderContinuous-v2')
|
# full('LunarLanderContinuous-v2')
|
||||||
|
Loading…
Reference in New Issue
Block a user