Source code for nnabla_rl.environments.environment_info

# Copyright 2020,2021 Sony Corporation.
# Copyright 2021 Sony Group Corporation.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from dataclasses import dataclass

import gym
import numpy as np


[docs]@dataclass class EnvironmentInfo(object): """Environment Information class This class contains the basic information of the target training environment. """ observation_space: gym.spaces.Space action_space: gym.spaces.Space max_episode_steps: int
[docs] @staticmethod def from_env(env): """Create env_info from environment Args: env (gym.Env): the environment Returns: EnvironmentInfo\ (:py:class:`EnvironmentInfo <nnabla_rl.environments.environment_info.EnvironmentInfo>`) Example: >>> import gym >>> from nnabla_rl.environments.environment_info import EnvironmentInfo >>> env = gym.make("CartPole-v0") >>> env_info = EnvironmentInfo.from_env(env) >>> env_info.state_shape (4,) """ return EnvironmentInfo(observation_space=env.observation_space, action_space=env.action_space, max_episode_steps=EnvironmentInfo._extract_max_episode_steps(env))
[docs] def is_discrete_action_env(self): ''' Check whether the action to execute in the environment is discrete or not Returns: bool: True if the action to execute in the environment is discrete. Otherwise False. ''' return isinstance(self.action_space, gym.spaces.Discrete)
[docs] def is_continuous_action_env(self): ''' Check whether the action to execute in the environment is continuous or not Returns: bool: True if the action to execute in the environment is continuous. Otherwise False. ''' return not self.is_discrete_action_env()
@property def state_shape(self): ''' The shape of observation space ''' return self.observation_space.shape @property def state_dim(self): ''' The dimension of state assuming that the state is flatten. ''' return np.prod(self.observation_space.shape) @property def action_shape(self): ''' The shape of action space ''' return self.action_space.shape @property def action_dim(self): ''' The dimension of action assuming that the action is flatten. ''' if self.is_discrete_action_env(): return self.action_space.n else: return np.prod(self.action_space.shape) @staticmethod def _extract_max_episode_steps(env): if env.spec is None or env.spec.max_episode_steps is None: return float("inf") else: return env.spec.max_episode_steps