| 
					
				 | 
			
			
				@@ -14,10 +14,7 @@ class GoToDoorEnv(MiniGridEnv): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         assert size >= 5 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         super().__init__(gridSize=size, maxSteps=10*size) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-        self.reward_range = (-1000, 1000) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-        # Flag determining whether the wait action ends the episode 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-        self.waitEnds = True 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+        self.reward_range = (-1, 1) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				     def _genGrid(self, width, height): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         # Create the grid 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -103,7 +100,6 @@ class GoToDoorEnv(MiniGridEnv): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         if action == self.actions.wait: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             if (ax == tx and abs(ay - ty) == 1) or (ay == ty and abs(ax - tx) == 1): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 reward = 1 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-            done = self.waitEnds 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         obs = self._observation(obs) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 |