doorkey.py 2.3 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091
  1. from gym_minigrid.minigrid import *
  2. from gym_minigrid.register import register
  3. class DoorKeyEnv(MiniGridEnv):
  4. """
  5. Environment with a door and key, sparse reward
  6. """
  7. def __init__(self, size=8):
  8. super().__init__(gridSize=size, maxSteps=4 * size)
  9. def _genGrid(self, width, height):
  10. # Create an empty grid
  11. grid = Grid(width, height)
  12. # Place walls around the edges
  13. for i in range(0, width):
  14. grid.set(i, 0, Wall())
  15. grid.set(i, height - 1, Wall())
  16. for j in range(0, height):
  17. grid.set(0, j, Wall())
  18. grid.set(height - 1, j, Wall())
  19. # Place a goal in the bottom-right corner
  20. grid.set(width - 2, height - 2, Goal())
  21. # Create a vertical splitting wall
  22. splitIdx = self._randInt(2, width-2)
  23. for i in range(0, height):
  24. grid.set(splitIdx, i, Wall())
  25. # Place the agent at a random position and orientation
  26. self.startPos = self._randPos(
  27. 1, splitIdx,
  28. 1, height-1
  29. )
  30. self.startDir = self._randInt(0, 4)
  31. # Place a door in the wall
  32. doorIdx = self._randInt(1, width-2)
  33. grid.set(splitIdx, doorIdx, LockedDoor('yellow'))
  34. # Place a yellow key on the left side
  35. while True:
  36. pos = self._randPos(
  37. 1, splitIdx,
  38. 1, height-1
  39. )
  40. if pos == self.startPos:
  41. continue
  42. if grid.get(*pos) != None:
  43. continue
  44. grid.set(*pos, Key('yellow'))
  45. break
  46. self.mission = "use the key to open the door and then get to the goal"
  47. return grid
  48. class DoorKeyEnv5x5(DoorKeyEnv):
  49. def __init__(self):
  50. super().__init__(size=5)
  51. class DoorKeyEnv6x6(DoorKeyEnv):
  52. def __init__(self):
  53. super().__init__(size=6)
  54. class DoorKeyEnv16x16(DoorKeyEnv):
  55. def __init__(self):
  56. super().__init__(size=16)
  57. register(
  58. id='MiniGrid-DoorKey-5x5-v0',
  59. entry_point='gym_minigrid.envs:DoorKeyEnv5x5'
  60. )
  61. register(
  62. id='MiniGrid-DoorKey-6x6-v0',
  63. entry_point='gym_minigrid.envs:DoorKeyEnv6x6'
  64. )
  65. register(
  66. id='MiniGrid-DoorKey-8x8-v0',
  67. entry_point='gym_minigrid.envs:DoorKeyEnv'
  68. )
  69. register(
  70. id='MiniGrid-DoorKey-16x16-v0',
  71. entry_point='gym_minigrid.envs:DoorKeyEnv16x16'
  72. )