fancy_gym/dmp_pd_control_example.py

28 lines
651 B
Python
Raw Normal View History

# Example script: evaluate a batch of random parameter vectors on several
# ball-in-a-cup environments through DmpAsyncVectorEnv and print the rewards.
# NOTE(review): judging by the names, the parameters are DMP weights and the
# environments run in parallel worker processes -- confirm against alr_envs.
from alr_envs.mujoco.ball_in_a_cup.utils import make_simple_env
from alr_envs.utils.dmp_async_vec_env import DmpAsyncVectorEnv
import numpy as np


if __name__ == "__main__":
    dim = 15        # length of one parameter vector
    n_cpus = 4      # number of environment constructors handed to the vec env
    n_samples = 10  # forwarded to DmpAsyncVectorEnv as `n_samples`

    # One entry per index in range(n_cpus).
    # NOTE(review): make_simple_env(i) presumably returns an env factory
    # (the commented-out example below calls its result) -- confirm.
    vec_env = DmpAsyncVectorEnv(
        [make_simple_env(i) for i in range(n_cpus)],
        n_samples=n_samples,
    )

    # Draw n_samples standard-normal rows of length `dim`, then stack that same
    # batch 10 times along axis 0, giving an array of shape
    # (10 * n_samples, dim). The leading `1 *` is a (currently neutral) scale.
    params = np.tile(1 * np.random.randn(n_samples, dim), (10, 1))

    # Calling the vectorized env with the parameter batch yields a pair that
    # is unpacked into rewards and infos; only the rewards are printed.
    rewards, infos = vec_env(params)
    print(rewards)

    # Single-environment alternative, kept disabled for reference:
    #
    # non_vec_env = make_simple_env(0, 0)()
    #
    # params = 10 * np.random.randn(dim)
    #
    # out2 = non_vec_env.rollout(params, render=True)
    #
    # print(out2)