.
This commit is contained in:
parent
b86498fa9a
commit
71670782b6
@ -88,7 +88,7 @@ class ActorCriticPolicy(BasePolicy):
|
|||||||
activation_fn: Type[nn.Module] = nn.Tanh,
|
activation_fn: Type[nn.Module] = nn.Tanh,
|
||||||
ortho_init: bool = True,
|
ortho_init: bool = True,
|
||||||
use_sde: bool = False,
|
use_sde: bool = False,
|
||||||
log_std_init: float = 0.0,
|
std_init: float = 1.0,
|
||||||
full_std: bool = True,
|
full_std: bool = True,
|
||||||
sde_net_arch: Optional[List[int]] = None,
|
sde_net_arch: Optional[List[int]] = None,
|
||||||
use_expln: bool = False,
|
use_expln: bool = False,
|
||||||
@ -135,7 +135,7 @@ class ActorCriticPolicy(BasePolicy):
|
|||||||
self.features_dim = self.features_extractor.features_dim
|
self.features_dim = self.features_extractor.features_dim
|
||||||
|
|
||||||
self.normalize_images = normalize_images
|
self.normalize_images = normalize_images
|
||||||
self.log_std_init = log_std_init
|
self.log_std_init = math.log(std_init)
|
||||||
# Keyword arguments for gSDE distribution
|
# Keyword arguments for gSDE distribution
|
||||||
if dist_kwargs == None:
|
if dist_kwargs == None:
|
||||||
dist_kwargs = {}
|
dist_kwargs = {}
|
||||||
|
@ -265,7 +265,7 @@ class SACPolicy(BasePolicy):
|
|||||||
net_arch: Optional[Union[List[int], Dict[str, List[int]]]] = None,
|
net_arch: Optional[Union[List[int], Dict[str, List[int]]]] = None,
|
||||||
activation_fn: Type[nn.Module] = nn.ReLU,
|
activation_fn: Type[nn.Module] = nn.ReLU,
|
||||||
use_sde: bool = False,
|
use_sde: bool = False,
|
||||||
log_std_init: float = -3,
|
std_init: float = 0.05,
|
||||||
sde_net_arch: Optional[List[int]] = None,
|
sde_net_arch: Optional[List[int]] = None,
|
||||||
use_expln: bool = False,
|
use_expln: bool = False,
|
||||||
clip_mean: float = 2.0,
|
clip_mean: float = 2.0,
|
||||||
@ -314,7 +314,7 @@ class SACPolicy(BasePolicy):
|
|||||||
|
|
||||||
sde_kwargs = {
|
sde_kwargs = {
|
||||||
"use_sde": use_sde,
|
"use_sde": use_sde,
|
||||||
"log_std_init": log_std_init,
|
"log_std_init": math.log(std_init),
|
||||||
"use_expln": use_expln,
|
"use_expln": use_expln,
|
||||||
"clip_mean": clip_mean,
|
"clip_mean": clip_mean,
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user