# Slate/example.yaml
# Base configuration document named DEFAULT. Another document in this file
# lists it as `import: :DEFAULT`.
# NOTE(review): the nesting below was reconstructed from a copy of this file
# whose indentation had been flattened. Sub-keys were attached to the nearest
# preceding section key; confirm in particular that `runner`, `video`, `test`
# and `pca` really are top-level sections.
name: DEFAULT
vars:
  foo: bar

slurm:
  # NOTE(review): there is no whitespace before `#`, so YAML treats the whole
  # text (including `# '{config[name]}'`) as the value, not as a comment. It is
  # quoted here to make that explicit; the value itself is unchanged. If the
  # trailing part was meant to be a comment, insert a space before `#`.
  name: "PerlinExp_Slate_DR# '{config[name]}'"
  partitions:
    - SINGLE
  num_parallel_jobs: 50
  cpus_per_task: 1
  mem-per-cpu: 3000
  time: 1440  # in minutes
  ntasks: 1
  sh_lines: ['']

runner: sb3

scheduler:
  total_timesteps: 10000
  repetitions: 3
  agents_per_job: 3
  reps_per_agent: 1
  bind_agent_to_core: true

wandb:
  project: '{config[name]}'
  sync_tensorboard: true
  monitor_gym: true
  save_code: false

video:
  enable: true
  length: 3000
  frequency: 100

test:
  enable: false
  length: 3000
  frequency: 100  # 32 # 10
  deterministic: Both
  num_envs: 1

env:
  name: BoxPushingDense-v0
  legacy_fancy: true
  normalize_obs: true
  normalize_rew: true
  num_envs: 1
  env_args:
    more_obs: true

algo:
  name: PPO
  policy_name: MlpPolicy
  n_steps: 4096
  vf_coef: 1.0e-5
  learning_rate: 5.0e-5
  batch_size: 512
  action_coef: 0
  ent_coef: 0
  normalize_advantage: false  # True

pca:
  enable: false
  window: 64
  skip_conditioning: true
  Base_Noise: WHITE
  init_std: 1.0

sweep:
  enable: false
  method: random
  # metric:
  #   goal: minimize
  #   name: score
  parameters:
    # Dotted key: presumably addresses `learning_rate` inside the `algo`
    # section; confirm against the consumer of this file.
    algo.learning_rate:
      min: 0.0001
      max: 0.1
---
# Document named `sweep`: sets two dotted keys on top of whatever `import`
# pulls in.
# NOTE(review): the meaning of `$` as an import target is not visible in this
# file; confirm against the consumer's documentation.
name: sweep
import: '$'
sweep.enable: true
scheduler.reps_per_agent: 3
---
# Document named `McNamo`; lists `:DEFAULT` as its import and sets a handful
# of keys of its own.
# NOTE(review): nesting was reconstructed from a flattened copy; `length` is
# assumed to belong to `video`, and `more_obs` to `env.env_args`, mirroring
# the DEFAULT document. `algo.name` and `leaf` are assumed top-level.
name: McNamo
import: ':DEFAULT'
video:
  length: 10
env:
  env_args:
    more_obs: false
algo.name: TRPL
leaf: false
---
# Document named `Leaf`; defines a single entry under `vars`.
# NOTE(review): `leaf` is assumed to be nested under `vars` (as `foo` is in
# the DEFAULT document); the flattened copy did not preserve indentation.
name: Leaf
vars:
  leaf: true
---
# Document named `Weird`; lists two import targets (`:McNamo` and `:Leaf`)
# in one comma-separated string and sets `leaf` itself.
# NOTE(review): how the consumer resolves conflicts between the two imports
# and the local `leaf` value is not visible in this file.
name: Weird
import: ':McNamo,:Leaf'
leaf: true
---
# Document named `Test_BaseTest`; uses the `printConfig` runner.
# `group` and `job_type` are nested under `wandb`, the only section key that
# precedes them.
name: Test_BaseTest
project: JustTesting
runner: printConfig
wandb:
  group: 'base'
  # NOTE(review): `{delta_desc}` looks like a placeholder filled in by the
  # consumer; its expansion is not defined in this file.
  job_type: '{delta_desc}'
---
# Document named `Test_Sweep`; uses the `printConfig` runner and declares
# `grid` and `ablative` sections listing alternative values for A and C.
# NOTE(review): nesting was reconstructed from a flattened copy. The scalar
# keys A/B/C are assumed to be top-level (not under `wandb`), with the list
# forms nested under `grid` / `ablative`; otherwise the keys would collide.
name: Test_Sweep
project: JustTesting
runner: printConfig
scheduler:
  repetitions: 16
wandb:
  group: 'sweep'
  job_type: '{delta_desc}'
A: 'dA'
B: 'dB'
C: 'dC'
grid:
  A: ['gA1', 'gA2']
  # B: ['gB1', 'gB2']
ablative:
  C: ['aC1', 'aC2']
---
# Document named `Test_CTR`; uses the `printConfig` runner and declares an
# `ablative` section listing ten alternative values for CTR.
# NOTE(review): nesting was reconstructed from a flattened copy. The scalar
# `CTR` is assumed to be top-level (not under `wandb`), with the list form
# nested under `ablative`; otherwise the two `CTR` keys would collide.
name: Test_CTR
project: JustTesting
runner: printConfig
scheduler:
  repetitions: 16
  reps_per_agent: 2
  agents_per_job: 2
wandb:
  group: 'ctr'
  job_type: '{delta_desc}'
CTR: 0
ablative:
  CTR: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]