stable-baselines3/tests/test_vec_check_nan.py

60 lines
1.4 KiB
Python
Raw Normal View History

2020-05-05 14:28:38 +00:00
import gym
import numpy as np
import pytest
from gym import spaces
2020-05-05 14:28:38 +00:00
2020-05-05 14:32:08 +00:00
from stable_baselines3.common.vec_env import DummyVecEnv, VecCheckNan
2020-05-05 14:28:38 +00:00
class NanAndInfEnv(gym.Env):
    """Minimal environment that emits NaN or inf observations on demand.

    The observation returned by ``step`` depends only on the sign of the
    action: NaN when every component is strictly positive, inf when every
    component is strictly negative, and ``0`` in every other case.
    """

    metadata = {"render.modes": ["human"]}

    def __init__(self):
        super().__init__()
        # Actions and observations share the same unbounded 1-element
        # float64 box definition.
        unbounded = dict(low=-np.inf, high=np.inf, shape=(1,), dtype=np.float64)
        self.action_space = spaces.Box(**unbounded)
        self.observation_space = spaces.Box(**unbounded)

    @staticmethod
    def step(action):
        """Return ``([obs], 0.0, False, {})`` with ``obs`` chosen from the action sign.

        :param action: anything ``np.array`` accepts
        :return: single-element observation list, a reward of ``0.0``,
            a done flag of ``False`` and an empty info dict
        """
        values = np.array(action)
        obs = 0  # fallback for mixed-sign, zero or NaN actions
        if np.all(values > 0):
            obs = float("NaN")
        elif np.all(values < 0):
            obs = float("inf")
        return [obs], 0.0, False, {}

    @staticmethod
    def reset():
        """Return the initial observation, ``[0.0]``."""
        return [0.0]

    def render(self, mode="human", close=False):
        """Do nothing; both arguments are ignored."""


def test_check_nan():
    """Check that VecCheckNan raises ValueError on NaN/inf and passes finite steps."""
    env = VecCheckNan(DummyVecEnv([NanAndInfEnv]), raise_exception=True)

    # A zero action makes NanAndInfEnv return a finite observation,
    # so this step must go through without raising.
    env.step([[0]])

    # Each of these must raise ValueError. The first two actions are
    # themselves non-finite; -1 and 1 make NanAndInfEnv.step return an
    # inf and a NaN observation respectively.
    for bad_value in (float("NaN"), float("inf"), -1, 1):
        with pytest.raises(ValueError):
            env.step([[bad_value]])

    # Each row mixes a zero with a positive value, so NanAndInfEnv.step
    # takes its finite fallback branch; no error is expected here.
    env.step(np.array([[0, 1], [0, 1]]))

    env.reset()