Fix bug when self.max_grad_norm=None

2024-01-23 13:32:38 +01:00 · 2024-01-23 13:32:38 +01:00 · 8bbb01504b
commit 8bbb01504b
parent c67f78159b
1 changed file with 3 additions and 2 deletions
--- a/metastable_baselines2/trpl/trpl.py
+++ b/metastable_baselines2/trpl/trpl.py
@@ -92,7 +92,7 @@ class TRPL(BetterOnPolicyAlgorithm):
        normalize_advantage: bool = True,
        ent_coef: float = 0.0,
        vf_coef: float = 0.5,
-        max_grad_norm: float = 0.5,
+        max_grad_norm: Union[float, None] = None,
        use_sde: bool = False,
        sde_sample_freq: int = -1,
        use_pca: bool = False,
@@ -306,6 +306,7 @@ class TRPL(BetterOnPolicyAlgorithm):
                self.policy.optimizer.zero_grad()
                loss.backward()
                # Clip grad norm
                if self.max_grad_norm is not None:
                    th.nn.utils.clip_grad_norm_(self.policy.parameters(), self.max_grad_norm)
                self.policy.optimizer.step()