From 48a39d7cb9ee65230fca64f9ed346e84ff8794ee Mon Sep 17 00:00:00 2001
From: Michael Luo
Date: Sun, 23 Aug 2020 03:53:08 -0700
Subject: [PATCH] [RLlib] Deepmind Control Suite Examples (#9751)

---
Review note: the new-file hunk was revised during review (module docstring
moved to the top, shared private helper, integer randint bound). The blob id
on its "index" line predates that revision.

 rllib/env/dm_control_wrapper.py        |  2 +-
 rllib/examples/env/dm_control_suite.py | 71 ++++++++++++++++++++++++++
 2 files changed, 72 insertions(+), 1 deletion(-)
 create mode 100644 rllib/examples/env/dm_control_suite.py

diff --git a/rllib/env/dm_control_wrapper.py b/rllib/env/dm_control_wrapper.py
index a9357e0f7..212bd9e9b 100644
--- a/rllib/env/dm_control_wrapper.py
+++ b/rllib/env/dm_control_wrapper.py
@@ -71,7 +71,7 @@ class DMCEnv(core.Env):
                  domain_name,
                  task_name,
                  task_kwargs=None,
-                 visualize_reward={},
+                 visualize_reward=False,
                  from_pixels=False,
                  height=84,
                  width=84,
diff --git a/rllib/examples/env/dm_control_suite.py b/rllib/examples/env/dm_control_suite.py
new file mode 100644
index 000000000..abddc3eb9
--- /dev/null
+++ b/rllib/examples/env/dm_control_suite.py
@@ -0,0 +1,71 @@
+"""Example environment factories for the DeepMind Control Suite.
+
+Each of the 8 public functions below builds a ``DMCEnv`` for one
+(domain, task) pair, passing ``from_pixels=True``, ``height=64``,
+``width=64`` and a random integer as the task's ``"random"`` kwarg.
+"""
+from ray.rllib.env.dm_control_wrapper import DMCEnv
+import numpy as np
+
+
+def _make_pixel_env(domain_name, task_name):
+    """Build a ``DMCEnv`` with the settings shared by every example here.
+
+    Args:
+        domain_name (str): Domain name forwarded to ``DMCEnv``.
+        task_name (str): Task name forwarded to ``DMCEnv``.
+
+    Returns:
+        DMCEnv: A new environment; a fresh integer in [0, 10**9) is
+            drawn on every call and passed as ``task_kwargs["random"]``.
+    """
+    # Integer bound instead of the float literal 1e9: np.random.randint
+    # documents integer bounds, and the sampled range is unchanged.
+    seed = np.random.randint(low=0, high=10**9)
+    return DMCEnv(
+        domain_name,
+        task_name,
+        from_pixels=True,
+        height=64,
+        width=64,
+        task_kwargs={"random": seed})
+
+
+def acrobot_swingup():
+    """Return a new ``DMCEnv`` for the "acrobot" domain, "swingup" task."""
+    return _make_pixel_env("acrobot", "swingup")
+
+
+def hopper_hop():
+    """Return a new ``DMCEnv`` for the "hopper" domain, "hop" task."""
+    return _make_pixel_env("hopper", "hop")
+
+
+def hopper_stand():
+    """Return a new ``DMCEnv`` for the "hopper" domain, "stand" task."""
+    return _make_pixel_env("hopper", "stand")
+
+
+def cheetah_run():
+    """Return a new ``DMCEnv`` for the "cheetah" domain, "run" task."""
+    return _make_pixel_env("cheetah", "run")
+
+
+def walker_run():
+    """Return a new ``DMCEnv`` for the "walker" domain, "run" task."""
+    return _make_pixel_env("walker", "run")
+
+
+def pendulum_swingup():
+    """Return a new ``DMCEnv`` for the "pendulum" domain, "swingup" task."""
+    return _make_pixel_env("pendulum", "swingup")
+
+
+def cartpole_swingup():
+    """Return a new ``DMCEnv`` for the "cartpole" domain, "swingup" task."""
+    return _make_pixel_env("cartpole", "swingup")
+
+
+def humanoid_walk():
+    """Return a new ``DMCEnv`` for the "humanoid" domain, "walk" task."""
+    return _make_pixel_env("humanoid", "walk")