---
# Training configuration with three top-level sections: policy, ppo, loggers.
# NOTE(review): the original indentation of this file was lost. The nesting
# below is reconstructed from the blank-line grouping of the keys and should
# be confirmed against the code that loads this file.

policy:
  input_dim: 4
  output_dim: 2
  hidden_sizes: [64, 64]

ppo:
  # Written with an explicit decimal point: YAML 1.1 loaders (e.g. PyYAML)
  # resolve a bare `3e-4` as a string rather than a float.
  learning_rate: 3.0e-4
  n_steps: 2048
  batch_size: 64
  n_epochs: 10
  gamma: 0.99
  gae_lambda: 0.95
  clip_range: 0.2
  total_timesteps: 1000000
  # NOTE(review): eval_interval has the same value as n_steps; presumably
  # intentional, confirm with the training loop.
  eval_interval: 2048
  eval_deterministic: true
  eval_episodes: 10
  seed: 42

loggers:
  - type: terminal
  - type: wandb
    # NOTE(review): project, entity and push_interval are assumed to belong
    # to this wandb entry; verify against the logger factory.
    project: "PPO_project"
    entity: "your_entity"  # looks like a placeholder value; TODO confirm
    push_interval: 10