diff --git a/sbBrix/common/off_policy_algorithm.py b/sbBrix/common/off_policy_algorithm.py index 4d5e0dd..816d033 100644 --- a/sbBrix/common/off_policy_algorithm.py +++ b/sbBrix/common/off_policy_algorithm.py @@ -85,6 +85,7 @@ class BetterOffPolicyAlgorithm(OffPolicyAlgorithm): ): assert not (use_sde and use_pca) self.use_pca = use_pca + policy_kwargs["use_pca"] = self.use_pca super().__init__( policy=policy, env=env,