parent
becb8d36e1
commit
ea7634ca42
@ -299,7 +299,7 @@ class ActorCriticPolicy(BasePolicy):
|
|||||||
values = self.value_net(latent_vf)
|
values = self.value_net(latent_vf)
|
||||||
distribution = self._get_action_dist_from_latent(latent_pi)
|
distribution = self._get_action_dist_from_latent(latent_pi)
|
||||||
if self.use_pca:
|
if self.use_pca:
|
||||||
actions = distribution.get_actions(deterministic=deterministic, traj=trajectory)
|
actions = distribution.get_actions(deterministic=deterministic, trajectory=trajectory)
|
||||||
else:
|
else:
|
||||||
actions = distribution.get_actions(deterministic=deterministic)
|
actions = distribution.get_actions(deterministic=deterministic)
|
||||||
log_prob = distribution.log_prob(actions)
|
log_prob = distribution.log_prob(actions)
|
||||||
|
Loading…
Reference in New Issue
Block a user