fixes

2023-08-22 01:01:13 +02:00 · 2023-08-22 01:01:13 +02:00 · d6c05668cb
commit d6c05668cb
parent 5739f365ab
1 changed files with 1 additions and 0 deletions
--- a/sbBrix/common/policies.py
+++ b/sbBrix/common/policies.py
@ -817,6 +817,7 @@ class Actor(BasePolicy):
            self.mu, self.log_std = self.action_dist.proba_distribution_net(
                latent_dim=last_layer_dim, return_log_std=True, **dist_kwargs
            )
            self._remember_log_std = log_std_init
            # Avoid numerical issues by limiting the mean of the Gaussian
            # to be in [-clip_mean, clip_mean]
            if clip_mean > 0.0: