Fix: Set initial logging std correctly

2023-08-22 01:18:44 +02:00 · 2023-08-22 01:18:44 +02:00 · 3c81a15630
commit 3c81a15630
parent a7cbc660e0
1 changed file with 1 addition and 1 deletion
--- a/sbBrix/common/policies.py
+++ b/sbBrix/common/policies.py
@@ -817,7 +817,7 @@ class Actor(BasePolicy):
            self.mu, self.log_std = self.action_dist.proba_distribution_net(
                latent_dim=last_layer_dim, return_log_std=True
            )
-            self._remember_log_std = log_std_init
+            self._remember_log_std = th.Tensor([log_std_init])
            # Avoid numerical issues by limiting the mean of the Gaussian
            # to be in [-clip_mean, clip_mean]
            if clip_mean > 0.0: