diff --git a/sbBrix/common/policies.py b/sbBrix/common/policies.py index 9e06244..a01c431 100644 --- a/sbBrix/common/policies.py +++ b/sbBrix/common/policies.py @@ -815,7 +815,7 @@ class Actor(BasePolicy): action_dim, **dist_kwargs ) self.mu, self.log_std = self.action_dist.proba_distribution_net( - latent_dim=last_layer_dim, return_log_std=True, **dist_kwargs + latent_dim=last_layer_dim, return_log_std=True ) self._remember_log_std = log_std_init # Avoid numerical issues by limiting the mean of the Gaussian