diff --git a/run_tensorboard.sh b/run_tensorboard.sh index 9623ac9..5197275 100755 --- a/run_tensorboard.sh +++ b/run_tensorboard.sh @@ -1,2 +1,2 @@ #!/bin/bash -tensorboard --logdir logs_tb/test +tensorboard --logdir logs_tb diff --git a/sb3_trl/trl_pg/__pycache__/trl_pg.cpython-310.pyc b/sb3_trl/trl_pg/__pycache__/trl_pg.cpython-310.pyc index cd40828..37e5875 100644 Binary files a/sb3_trl/trl_pg/__pycache__/trl_pg.cpython-310.pyc and b/sb3_trl/trl_pg/__pycache__/trl_pg.cpython-310.pyc differ diff --git a/sb3_trl/trl_pg/trl_pg.py b/sb3_trl/trl_pg/trl_pg.py index 9f524e6..1d813f5 100644 --- a/sb3_trl/trl_pg/trl_pg.py +++ b/sb3_trl/trl_pg/trl_pg.py @@ -322,7 +322,7 @@ class TRL_PG(OnPolicyAlgorithm): eval_env: Optional[GymEnv] = None, eval_freq: int = -1, n_eval_episodes: int = 5, - tb_log_name: str = "PPO", + tb_log_name: str = "TRL_PG", eval_log_path: Optional[str] = None, reset_num_timesteps: bool = True, ) -> "TRL_PG": diff --git a/test.py b/test.py index 9bfa910..dbe7a53 100644 --- a/test.py +++ b/test.py @@ -19,6 +19,7 @@ def main(): "MlpPolicy", env, verbose=0, + tensorboard_log="./logs_tb/test/", ) trl = TRL_PG( "MlpPolicy",