multiroom.py 7.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234
  1. from gym_minigrid.minigrid import COLOR_NAMES, Door, Goal, Grid, MiniGridEnv, Wall
  2. from gym_minigrid.register import register
  3. class MultiRoom:
  4. def __init__(self,
  5. top,
  6. size,
  7. entryDoorPos,
  8. exitDoorPos
  9. ):
  10. self.top = top
  11. self.size = size
  12. self.entryDoorPos = entryDoorPos
  13. self.exitDoorPos = exitDoorPos
  14. class MultiRoomEnv(MiniGridEnv):
  15. """
  16. Environment with multiple rooms (subgoals)
  17. """
  18. def __init__(self, minNumRooms, maxNumRooms, maxRoomSize=10, **kwargs):
  19. assert minNumRooms > 0
  20. assert maxNumRooms >= minNumRooms
  21. assert maxRoomSize >= 4
  22. self.minNumRooms = minNumRooms
  23. self.maxNumRooms = maxNumRooms
  24. self.maxRoomSize = maxRoomSize
  25. self.rooms = []
  26. super().__init__(grid_size=25, max_steps=self.maxNumRooms * 20, **kwargs)
  27. def _gen_grid(self, width, height):
  28. roomList = []
  29. # Choose a random number of rooms to generate
  30. numRooms = self._rand_int(self.minNumRooms, self.maxNumRooms + 1)
  31. while len(roomList) < numRooms:
  32. curRoomList = []
  33. entryDoorPos = (self._rand_int(0, width - 2), self._rand_int(0, width - 2))
  34. # Recursively place the rooms
  35. self._placeRoom(
  36. numRooms,
  37. roomList=curRoomList,
  38. minSz=4,
  39. maxSz=self.maxRoomSize,
  40. entryDoorWall=2,
  41. entryDoorPos=entryDoorPos,
  42. )
  43. if len(curRoomList) > len(roomList):
  44. roomList = curRoomList
  45. # Store the list of rooms in this environment
  46. assert len(roomList) > 0
  47. self.rooms = roomList
  48. # Create the grid
  49. self.grid = Grid(width, height)
  50. wall = Wall()
  51. prevDoorColor = None
  52. # For each room
  53. for idx, room in enumerate(roomList):
  54. topX, topY = room.top
  55. sizeX, sizeY = room.size
  56. # Draw the top and bottom walls
  57. for i in range(0, sizeX):
  58. self.grid.set(topX + i, topY, wall)
  59. self.grid.set(topX + i, topY + sizeY - 1, wall)
  60. # Draw the left and right walls
  61. for j in range(0, sizeY):
  62. self.grid.set(topX, topY + j, wall)
  63. self.grid.set(topX + sizeX - 1, topY + j, wall)
  64. # If this isn't the first room, place the entry door
  65. if idx > 0:
  66. # Pick a door color different from the previous one
  67. doorColors = set(COLOR_NAMES)
  68. if prevDoorColor:
  69. doorColors.remove(prevDoorColor)
  70. # Note: the use of sorting here guarantees determinism,
  71. # This is needed because Python's set is not deterministic
  72. doorColor = self._rand_elem(sorted(doorColors))
  73. entryDoor = Door(doorColor)
  74. self.grid.set(*room.entryDoorPos, entryDoor)
  75. prevDoorColor = doorColor
  76. prevRoom = roomList[idx - 1]
  77. prevRoom.exitDoorPos = room.entryDoorPos
  78. # Randomize the starting agent position and direction
  79. self.place_agent(roomList[0].top, roomList[0].size)
  80. # Place the final goal in the last room
  81. self.goal_pos = self.place_obj(Goal(), roomList[-1].top, roomList[-1].size)
  82. self.mission = "traverse the rooms to get to the goal"
  83. def _placeRoom(self, numLeft, roomList, minSz, maxSz, entryDoorWall, entryDoorPos):
  84. # Choose the room size randomly
  85. sizeX = self._rand_int(minSz, maxSz + 1)
  86. sizeY = self._rand_int(minSz, maxSz + 1)
  87. # The first room will be at the door position
  88. if len(roomList) == 0:
  89. topX, topY = entryDoorPos
  90. # Entry on the right
  91. elif entryDoorWall == 0:
  92. topX = entryDoorPos[0] - sizeX + 1
  93. y = entryDoorPos[1]
  94. topY = self._rand_int(y - sizeY + 2, y)
  95. # Entry wall on the south
  96. elif entryDoorWall == 1:
  97. x = entryDoorPos[0]
  98. topX = self._rand_int(x - sizeX + 2, x)
  99. topY = entryDoorPos[1] - sizeY + 1
  100. # Entry wall on the left
  101. elif entryDoorWall == 2:
  102. topX = entryDoorPos[0]
  103. y = entryDoorPos[1]
  104. topY = self._rand_int(y - sizeY + 2, y)
  105. # Entry wall on the top
  106. elif entryDoorWall == 3:
  107. x = entryDoorPos[0]
  108. topX = self._rand_int(x - sizeX + 2, x)
  109. topY = entryDoorPos[1]
  110. else:
  111. assert False, entryDoorWall
  112. # If the room is out of the grid, can't place a room here
  113. if topX < 0 or topY < 0:
  114. return False
  115. if topX + sizeX > self.width or topY + sizeY >= self.height:
  116. return False
  117. # If the room intersects with previous rooms, can't place it here
  118. for room in roomList[:-1]:
  119. nonOverlap = (
  120. topX + sizeX < room.top[0]
  121. or room.top[0] + room.size[0] <= topX
  122. or topY + sizeY < room.top[1]
  123. or room.top[1] + room.size[1] <= topY
  124. )
  125. if not nonOverlap:
  126. return False
  127. # Add this room to the list
  128. roomList.append(MultiRoom(
  129. (topX, topY),
  130. (sizeX, sizeY),
  131. entryDoorPos,
  132. None
  133. ))
  134. # If this was the last room, stop
  135. if numLeft == 1:
  136. return True
  137. # Try placing the next room
  138. for i in range(0, 8):
  139. # Pick which wall to place the out door on
  140. wallSet = {0, 1, 2, 3}
  141. wallSet.remove(entryDoorWall)
  142. exitDoorWall = self._rand_elem(sorted(wallSet))
  143. nextEntryWall = (exitDoorWall + 2) % 4
  144. # Pick the exit door position
  145. # Exit on right wall
  146. if exitDoorWall == 0:
  147. exitDoorPos = (topX + sizeX - 1, topY + self._rand_int(1, sizeY - 1))
  148. # Exit on south wall
  149. elif exitDoorWall == 1:
  150. exitDoorPos = (topX + self._rand_int(1, sizeX - 1), topY + sizeY - 1)
  151. # Exit on left wall
  152. elif exitDoorWall == 2:
  153. exitDoorPos = (topX, topY + self._rand_int(1, sizeY - 1))
  154. # Exit on north wall
  155. elif exitDoorWall == 3:
  156. exitDoorPos = (topX + self._rand_int(1, sizeX - 1), topY)
  157. else:
  158. assert False
  159. # Recursively create the other rooms
  160. success = self._placeRoom(
  161. numLeft - 1,
  162. roomList=roomList,
  163. minSz=minSz,
  164. maxSz=maxSz,
  165. entryDoorWall=nextEntryWall,
  166. entryDoorPos=exitDoorPos,
  167. )
  168. if success:
  169. break
  170. return True
  171. register(
  172. id='MiniGrid-MultiRoom-N2-S4-v0',
  173. entry_point='gym_minigrid.envs.multiroom:MultiRoomEnv',
  174. minNumRooms=2,
  175. maxNumRooms=2,
  176. maxRoomSize=4
  177. )
  178. register(
  179. id='MiniGrid-MultiRoom-N4-S5-v0',
  180. entry_point='gym_minigrid.envs.multiroom:MultiRoomEnv',
  181. minNumRooms=4,
  182. maxNumRooms=4,
  183. maxRoomSize=5
  184. )
  185. register(
  186. id='MiniGrid-MultiRoom-N6-v0',
  187. entry_point='gym_minigrid.envs.multiroom:MultiRoomEnv',
  188. minNumRooms=6,
  189. maxNumRooms=6
  190. )