7 years ago · 6db3f6bb87
--- a/gym_minigrid/envs/gotodoor.py
+++ b/gym_minigrid/envs/gotodoor.py
@@ -1,3 +1,4 @@
 
																+from gym import spaces
															
 
																 from gym_minigrid.minigrid import *
															
 
																 from gym_minigrid.register import register
															
@@ -14,6 +15,10 @@ class GoToDoorEnv(MiniGridEnv):
 
																         assert size >= 5
															
 
																         super().__init__(gridSize=size, maxSteps=10*size)
															
 
																+        self.observation_space = spaces.Dict({
															
 
																+            'image': self.observation_space
															
 
																+        })
															
 
																+
															
 
																         self.reward_range = (-1, 1)
															
 
																     def _genGrid(self, width, height):
															
--- a/gym_minigrid/wrappers.py
+++ b/gym_minigrid/wrappers.py
@@ -86,12 +86,13 @@ class FlatObsWrapper(gym.core.ObservationWrapper):
 
																         self.maxStrLen = maxStrLen
															
 
																         self.numCharCodes = 27
															
 
																-        obsSize = batch_numel = reduce(operator.mul, self.observation_space.shape, 1)
															
 
																+        imgSpace = env.observation_space.spaces['image']
															
 
																+        imgSize = reduce(operator.mul, imgSpace.shape, 1)
															
 
																         self.observation_space = spaces.Box(
															
 
																             low=0,
															
 
																             high=255,
															
 
																-            shape=obsSize + self.numCharCodes * self.maxStrLen
															
 
																+            shape=imgSize + self.numCharCodes * self.maxStrLen
															
 
																         )
															
 
																         self.cachedStr = None
															
--- a/pytorch_rl/envs.py
+++ b/pytorch_rl/envs.py
@@ -1,7 +1,7 @@
 
																 import os
															
 
																 import numpy
															
 
																 import gym
															
 
																-from gym.spaces.box import Box
															
 
																+from gym import spaces
															
 
																 try:
															
 
																     import gym_minigrid
															
@@ -15,7 +15,9 @@ def make_env(env_id, seed, rank, log_dir):
 
																         env.seed(seed + rank)
															
 
																-        #env = FlatObsWrapper(env)
															
 
																+        # Maxime: until RL code supports dict observations, squash observations into a flat vector
															
 
																+        if isinstance(env.observation_space, spaces.Dict):
															
 
																+            env = FlatObsWrapper(env)
															
 
																         # If the input has shape (W,H,3), wrap for PyTorch convolutions
															
 
																         obs_shape = env.observation_space.shape
															
@@ -30,7 +32,7 @@ class WrapPyTorch(gym.ObservationWrapper):
 
																     def __init__(self, env=None):
															
 
																         super(WrapPyTorch, self).__init__(env)
															
 
																         obs_shape = self.observation_space.shape
															
 
																-        self.observation_space = Box(
															
 
																+        self.observation_space = spaces.Box(
															
 
																             self.observation_space.low[0,0,0],
															
 
																             self.observation_space.high[0,0,0],
															
 
																             [obs_shape[2], obs_shape[1], obs_shape[0]]