stable-baselines3/stable_baselines3/common/vec_env/util.py

75 lines
2.8 KiB
Python
Raw Normal View History

2019-09-20 13:18:25 +00:00
"""
Helpers for dealing with vectorized environments.
"""
from collections import OrderedDict
from typing import Any, Dict, List, Tuple
2019-09-20 13:18:25 +00:00
import gym
import numpy as np
from stable_baselines3.common.vec_env.base_vec_env import VecEnvObs
2019-09-20 13:18:25 +00:00
def copy_obs_dict(obs: Dict[str, np.ndarray]) -> Dict[str, np.ndarray]:
2019-09-20 13:18:25 +00:00
"""
Deep-copy a dict of numpy arrays.
:param obs: a dict of numpy arrays.
:return: a dict of copied numpy arrays.
2019-09-20 13:18:25 +00:00
"""
2020-01-22 15:39:25 +00:00
assert isinstance(obs, OrderedDict), f"unexpected type for observations '{type(obs)}'"
2019-09-20 13:18:25 +00:00
return OrderedDict([(k, np.copy(v)) for k, v in obs.items()])
def dict_to_obs(space: gym.spaces.Space, obs_dict: Dict[Any, np.ndarray]) -> VecEnvObs:
2019-09-20 13:18:25 +00:00
"""
Convert an internal representation raw_obs into the appropriate type
specified by space.
:param space: an observation space.
:param obs_dict: a dict of numpy arrays.
:return: returns an observation of the same type as space.
If space is Dict, function is identity; if space is Tuple, converts dict to Tuple;
otherwise, space is unstructured and returns the value raw_obs[None].
2019-09-20 13:18:25 +00:00
"""
if isinstance(space, gym.spaces.Dict):
return obs_dict
elif isinstance(space, gym.spaces.Tuple):
assert len(obs_dict) == len(space.spaces), "size of observation does not match size of observation space"
return tuple((obs_dict[i] for i in range(len(space.spaces))))
else:
assert set(obs_dict.keys()) == {None}, "multiple observation keys for unstructured observation space"
return obs_dict[None]
def obs_space_info(obs_space: gym.spaces.Space) -> Tuple[List[str], Dict[Any, Tuple[int, ...]], Dict[Any, np.dtype]]:
2019-09-20 13:18:25 +00:00
"""
Get dict-structured information about a gym.Space.
Dict spaces are represented directly by their dict of subspaces.
Tuple spaces are converted into a dict with keys indexing into the tuple.
Unstructured spaces are represented by {None: obs_space}.
:param obs_space: an observation space
:return: A tuple (keys, shapes, dtypes):
2019-09-20 13:18:25 +00:00
keys: a list of dict keys.
shapes: a dict mapping keys to shapes.
dtypes: a dict mapping keys to dtypes.
"""
if isinstance(obs_space, gym.spaces.Dict):
assert isinstance(obs_space.spaces, OrderedDict), "Dict space must have ordered subspaces"
subspaces = obs_space.spaces
elif isinstance(obs_space, gym.spaces.Tuple):
subspaces = {i: space for i, space in enumerate(obs_space.spaces)}
else:
assert not hasattr(obs_space, "spaces"), f"Unsupported structured space '{type(obs_space)}'"
2019-09-20 13:18:25 +00:00
subspaces = {None: obs_space}
keys = []
shapes = {}
dtypes = {}
for key, box in subspaces.items():
keys.append(key)
shapes[key] = box.shape
dtypes[key] = box.dtype
return keys, shapes, dtypes