Better default HPs for TRPL
This commit is contained in:
parent
5b9f8b028c
commit
e3f4c511bf
@ -87,7 +87,7 @@ class TRPL(BetterOnPolicyAlgorithm):
|
||||
n_epochs: int = 10,
|
||||
gamma: float = 0.99,
|
||||
gae_lambda: float = 0.95,
|
||||
clip_range: Union[float, Schedule] = 0.2,
|
||||
clip_range: Union[float, Schedule, None] = None,
|
||||
clip_range_vf: Union[None, float, Schedule] = None,
|
||||
normalize_advantage: bool = True,
|
||||
ent_coef: float = 0.0,
|
||||
@ -169,7 +169,11 @@ class TRPL(BetterOnPolicyAlgorithm):
|
||||
)
|
||||
self.batch_size = batch_size
|
||||
self.n_epochs = n_epochs
|
||||
if clip_range == False:
|
||||
clip_range = None
|
||||
self.clip_range = clip_range
|
||||
if clip_range_vf == False:
|
||||
clip_range_vf = None
|
||||
self.clip_range_vf = clip_range_vf
|
||||
self.normalize_advantage = normalize_advantage
|
||||
self.projection = castProjection(projection)
|
||||
|
Loading…
Reference in New Issue
Block a user