How to pass customized environment with customized preprocessor

Giang_Ha · July 17, 2021, 3:34am

Hi, I would like to configure an environment for the Mario game like the one in the PyTorch RL tutorial (Train a Mario-playing RL Agent — PyTorch Tutorials 1.9.0+cu102 documentation). It has several customized preprocessors. How could I adapt it to RLlib? Thanks for your help. Below is some of the code that the PyTorch tutorial uses:

import gym
from gym.spaces import Box
from gym.wrappers import FrameStack
from nes_py.wrappers import JoypadSpace
import gym_super_mario_bros

class SkipFrame(gym.Wrapper):
    """Gym wrapper that applies each action to several consecutive frames.

    Only the observation of the last executed frame is returned; the rewards
    of all executed frames are summed.
    """

    def __init__(self, env, skip):
        """Return only every `skip`-th frame.

        Args:
            env: The environment to wrap.
            skip: Maximum number of inner steps performed per `step` call.
                Must be at least 1.

        Raises:
            ValueError: If `skip` is smaller than 1. Without at least one
                inner step there is no observation to return from `step`.
        """
        if skip < 1:
            raise ValueError("skip must be at least 1, got {!r}".format(skip))
        super().__init__(env)
        self._skip = skip

    def step(self, action):
        """Repeat action, and sum reward.

        Args:
            action: The action forwarded unchanged to every inner step.

        Returns:
            A tuple `(obs, total_reward, done, info)` where `obs`, `done` and
            `info` come from the last inner step that was executed and
            `total_reward` is the sum of the rewards of all executed steps.
        """
        total_reward = 0.0
        for _ in range(self._skip):
            # Accumulate reward and repeat the same action
            obs, reward, done, info = self.env.step(action)
            total_reward += reward
            if done:
                # Stop early: the episode is over, further steps are invalid.
                break
        return obs, total_reward, done, info


class GrayScaleObservation(gym.ObservationWrapper):
    """Observation wrapper that converts frames to grayscale.

    NOTE(review): the declared `observation_space` is a uint8 Box shaped like
    the first two dimensions of the wrapped space, while `observation`
    returns a float torch tensor produced by `T.Grayscale` (which presumably
    keeps a channel dimension). Frameworks that validate observations against
    the declared space may reject this -- confirm before relying on it.
    """

    def __init__(self, env):
        """Wrap `env` and declare a 2-D observation space.

        Args:
            env: The environment to wrap; its observation space shape is
                assumed to start with (height, width) -- TODO confirm.
        """
        super().__init__(env)
        obs_shape = self.observation_space.shape[:2]
        self.observation_space = Box(low=0, high=255, shape=obs_shape, dtype=np.uint8)
        # Build the transform once instead of on every observation; it takes
        # no per-frame arguments, so a single instance can be reused.
        self._to_grayscale = T.Grayscale()

    def permute_orientation(self, observation):
        """Convert an [H, W, C] array into a float [C, H, W] tensor."""
        # permute [H, W, C] array to [C, H, W] tensor
        observation = np.transpose(observation, (2, 0, 1))
        # `.copy()` materialises the transposed view before handing it to torch.
        observation = torch.tensor(observation.copy(), dtype=torch.float)
        return observation

    def observation(self, observation):
        """Return the grayscale version of `observation` as a torch tensor."""
        observation = self.permute_orientation(observation)
        return self._to_grayscale(observation)


class ResizeObservation(gym.ObservationWrapper):
    """Observation wrapper that resizes frames and applies `T.Normalize(0, 255)`."""

    def __init__(self, env, shape):
        """Wrap `env` and declare the resized observation space.

        Args:
            env: The environment to wrap.
            shape: Target size. An `int` is expanded to `(shape, shape)`;
                anything else is converted with `tuple(shape)`.
        """
        super().__init__(env)
        if isinstance(shape, int):
            self.shape = (shape, shape)
        else:
            self.shape = tuple(shape)

        # Keep any trailing dimensions (beyond the first two) of the wrapped space.
        obs_shape = self.shape + self.observation_space.shape[2:]
        self.observation_space = Box(low=0, high=255, shape=obs_shape, dtype=np.uint8)

        # Build the pipeline once instead of on every observation. The target
        # size is therefore fixed at construction time: changing `self.shape`
        # afterwards does not affect the transform.
        self._transforms = T.Compose(
            [T.Resize(self.shape), T.Normalize(0, 255)]
        )

    def observation(self, observation):
        """Resize and normalize `observation`, then drop a leading size-1 axis."""
        # `squeeze(0)` only removes dimension 0 when its size is 1.
        return self._transforms(observation).squeeze(0)

# Build the wrapped Mario environment. Each wrapper receives the result of the
# previous line, so the order of these statements matters.

# Create the base environment from its registered id.
env = gym_super_mario_bros.make("SuperMarioBros-1-1-v0")
# Restrict the action space to the two listed button combinations
# (presumably "move right" and "move right + jump" -- confirm in nes_py docs).
env = JoypadSpace(env, [["right"], ["right", "A"]])
# Apply each action for up to 4 frames and sum the rewards.
env = SkipFrame(env, skip=4)
# Convert frames to grayscale torch tensors.
env = GrayScaleObservation(env)
# Resize frames to 84x84 (an int shape is expanded to a square) and normalize.
env = ResizeObservation(env, shape=84)
# Stack observations with gym's FrameStack (num_stack=4); presumably the 4
# most recent frames -- see the gym.wrappers.FrameStack documentation.
env = FrameStack(env, num_stack=4)

mannyv · July 17, 2021, 11:06am

Hi @Giang_Ha,

I think the most straightforward way to do that is just like this example does:

github.com

ray-project/ray/blob/9da49a7fb85b95cc1ed2006434ab240840cb8210/rllib/examples/pettingzoo_env.py#L25

    
      
          1. Algorithm name and according module, e.g.: "PPo" + agents.ppo as agent
          2. Name of the aec game you want to train on, e.g.: "pistonball".
          3. num_cpus
          4. num_rollouts
          
          
Does require SuperSuit
          """
          alg_name = "PPO"
          
          
# Function that outputs the environment you wish to register.
          def env_creator(config):
              """Create the pistonball environment and apply the wrapper chain.

              `config` is read with `.get`, so a missing "local_ratio" key
              falls back to 0.2.
              """
              ratio = config.get("local_ratio", 0.2)
              base_env = pistonball_v4.env(local_ratio=ratio)
              typed_env = dtype_v0(base_env, dtype=float32)
              reduced_env = color_reduction_v0(typed_env, mode="R")
              return normalize_obs_v0(reduced_env)
          
          
num_cpus = 1
          num_rollouts = 2
          
          
# Gets default training configuration and specifies the POMgame to load.

Topic		Replies	Views
Use gym.wrappers for Training RLlib	5	1599	January 12, 2022
Atari Preprocessors for Atari-like environments RLlib	0	340	June 12, 2021
Model doesn't recognize ObservationWrapper and keeps using orig_observation RLlib	4	355	October 7, 2022
Custom preprocessors and original_space variable RLlib	4	1027	March 15, 2021
How to use gym environment that require an individual python process with RLLIB? RLlib	1	420	January 25, 2021

How to pass customized environment with customized preprocessor

Related topics