Fix: Set initial logging std correctly
This commit is contained in:
parent
a7cbc660e0
commit
3c81a15630
@ -817,7 +817,7 @@ class Actor(BasePolicy):
|
|||||||
self.mu, self.log_std = self.action_dist.proba_distribution_net(
|
self.mu, self.log_std = self.action_dist.proba_distribution_net(
|
||||||
latent_dim=last_layer_dim, return_log_std=True
|
latent_dim=last_layer_dim, return_log_std=True
|
||||||
)
|
)
|
||||||
self._remember_log_std = log_std_init
|
self._remember_log_std = th.Tensor([log_std_init])
|
||||||
# Avoid numerical issues by limiting the mean of the Gaussian
|
# Avoid numerical issues by limiting the mean of the Gaussian
|
||||||
# to be in [-clip_mean, clip_mean]
|
# to be in [-clip_mean, clip_mean]
|
||||||
if clip_mean > 0.0:
|
if clip_mean > 0.0:
|
||||||
|
Loading…
Reference in New Issue
Block a user