index.html 36 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634
  1. <!doctype html>
  2. <html class="no-js" lang="en">
  3. <head><meta charset="utf-8"/>
  4. <meta name="viewport" content="width=device-width,initial-scale=1"/>
  5. <meta name="color-scheme" content="light dark">
  6. <meta name="description" content="">
  7. <meta property="og:title" content="MiniGrid Documentation" />
  8. <meta property="og:type" content="website" />
  9. <meta property="og:description" content="" />
  10. <meta property="og:url" content="https://minigrid.farama.org/content/basic_usage.html" /><meta name="twitter:card" content="summary_large_image"><meta name="generator" content="Docutils 0.19: https://docutils.sourceforge.io/" />
  11. <link rel="index" title="Index" href="../../genindex/" /><link rel="search" title="Search" href="../../search/" /><link rel="next" title="List of Publications" href="../publications/" /><link rel="prev" title="Minigrid contains simple and easily configurable grid world environments to conduct Reinforcement Learning research. This library was previously known as gym-minigrid." href="../../" />
  12. <link rel="canonical" href="https://minigrid.farama.org/content/basic_usage.html" />
  13. <link rel="shortcut icon" href="../../_static/minigrid-favicon.png"/><meta name="generator" content="sphinx-5.2.3, furo 2022.09.15.dev1"/>
  14. <title>Basic Usage - MiniGrid Documentation</title>
  15. <link rel="stylesheet" type="text/css" href="../../_static/pygments.css" />
  16. <link rel="stylesheet" type="text/css" href="../../_static/styles/furo.css?digest=c36209c3579494d5f9512671edd8cd731f7c406c" />
  17. <link rel="stylesheet" type="text/css" href="../../_static/styles/furo-extensions.css?digest=57f753f2a36df4cd87bf0e4232aabc9b3cc73912" />
  18. <style>
  19. body {
  20. --color-code-background: #f8f8f8;
  21. --color-code-foreground: black;
  22. }
  23. @media not print {
  24. body[data-theme="dark"] {
  25. --color-code-background: #202020;
  26. --color-code-foreground: #d0d0d0;
  27. }
  28. @media (prefers-color-scheme: dark) {
  29. body:not([data-theme="light"]) {
  30. --color-code-background: #202020;
  31. --color-code-foreground: #d0d0d0;
  32. }
  33. }
  34. }
  35. </style></head>
  36. <body>
  37. <header class="farama-header" aria-label="Farama header">
  38. <div class="farama-header__container">
  39. <div class="farama-header__left--mobile">
  40. <label class="nav-overlay-icon" for="__navigation">
  41. <div class="visually-hidden">Toggle site navigation sidebar</div>
  42. <svg viewBox="0 0 24 24" xmlns="http://www.w3.org/2000/svg">
  43. <defs></defs>
  44. <line x1="0.5" y1="4" x2="23.5" y2="4"></line>
  45. <line x1="0.232" y1="12" x2="23.5" y2="12"></line>
  46. <line x1="0.232" y1="20" x2="23.5" y2="20"></line>
  47. </svg>
  48. <!-- <svg viewBox="0 0 24 24" viewBox="0 0 24 24" xmlns="http://www.w3.org/2000/svg">
  49. <line x1="0.5" y1="4.5" x2="23.5" y2="4.5" style="fill: none; "></line>
  50. <line x1="0.5" y1="12" x2="14" y2="12" ></line>
  51. <line x1="0.5" y1="19.5" x2="23.5" y2="19.5"></line>
  52. <polyline style="stroke-width: 0px;" points="17 7 22 12 17 17"></polyline>
  53. </svg> -->
  54. <!-- <svg viewBox="0 0 24 24" xmlns="http://www.w3.org/2000/svg" style="width:20px">
  55. <defs></defs>
  56. <rect y="1" width="22" height="22" rx="2" ry="2" style="fill: none;" x="1"></rect>
  57. <line x1="8" y1="1" x2="8" y2="23"></line>
  58. <polyline style="stroke-linecap: round; fill: none; stroke-linejoin: round;" points="13 7 17 12 13 17"></polyline>
  59. </svg> -->
  60. </label>
  61. </div>
  62. <div class="farama-header__left farama-header__center--mobile">
  63. <a href="../../">
  64. <img class="farama-header__logo only-light" src="../../_static/img/minigrid.svg" alt="Light Logo"/>
  65. <img class="farama-header__logo only-dark" src="../../_static/img/minigrid-white.svg" alt="Dark Logo"/>
  66. <span class="farama-header__title">MiniGrid Documentation</span>
  67. </a>
  68. </div>
  69. <div class="farama-header__right">
  70. <div class="farama-header-menu">
  71. <button class="farama-header-menu__btn" aria-label="Open Farama Menu" aria-expanded="false" aria-haspopup="true" aria-controls="farama-menu">
  72. <img class="farama-white-logo-invert" src="../../_static/img/farama-logo-header.svg" alt="">
  73. <svg viewBox="0 0 24 24" xmlns="http://www.w3.org/2000/svg">
  74. <polyline style="stroke-linecap: round; stroke-linejoin: round; fill: none; stroke-width: 2px;" points="1 7 12 18 23 7"></polyline>
  75. </svg>
  76. </button>
  77. <div class="farama-header-menu-container farama-hidden" aria-hidden="true" id="farama-menu">
  78. <div class="farama-header-menu__header">
  79. <a href="https://farama.org">
  80. <img class="farama-header-menu__logo farama-white-logo-invert" src="../../_static/img/farama_solid_white.svg" alt="Farama Foundation logo">
  81. <span>Farama Foundation</span>
  82. </a>
  83. <div class="farama-header-menu-header__right">
  84. <button id="farama-close-menu" aria-label="Close Farama Menu">
  85. <svg viewBox="0 0 24 24" xmlns="http://www.w3.org/2000/svg" fill="none" stroke="currentColor"
  86. stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="icon-close">
  87. <line x1="3" y1="21" x2="21" y2="3"></line>
  88. <line x1="3" y1="3" x2="21" y2="21"></line>
  89. </svg>
  90. </button>
  91. </div>
  92. </div>
  93. <div class="farama-header-menu__body">
  94. <!-- Response from farama.org/api/projects.json -->
  95. </div>
  96. </div>
  97. </div>
  98. </div>
  99. </div>
  100. </header>
  101. <script>
  // Stamp the stored theme choice onto <body> as its data-theme attribute,
  // using "auto" when nothing (or an empty value) is saved under "theme".
  document.body.setAttribute(
    "data-theme",
    localStorage.getItem("theme") || "auto",
  );
  103. </script>
  104. <svg xmlns="http://www.w3.org/2000/svg" style="display: none;">
  105. <symbol id="svg-toc" viewBox="0 0 24 24">
  106. <title>Contents</title>
  107. <svg stroke="currentColor" fill="currentColor" stroke-width="0" viewBox="0 0 1024 1024">
  108. <path d="M408 442h480c4.4 0 8-3.6 8-8v-56c0-4.4-3.6-8-8-8H408c-4.4 0-8 3.6-8 8v56c0 4.4 3.6 8 8 8zm-8 204c0 4.4 3.6 8 8 8h480c4.4 0 8-3.6 8-8v-56c0-4.4-3.6-8-8-8H408c-4.4 0-8 3.6-8 8v56zm504-486H120c-4.4 0-8 3.6-8 8v56c0 4.4 3.6 8 8 8h784c4.4 0 8-3.6 8-8v-56c0-4.4-3.6-8-8-8zm0 632H120c-4.4 0-8 3.6-8 8v56c0 4.4 3.6 8 8 8h784c4.4 0 8-3.6 8-8v-56c0-4.4-3.6-8-8-8zM115.4 518.9L271.7 642c5.8 4.6 14.4.5 14.4-6.9V388.9c0-7.4-8.5-11.5-14.4-6.9L115.4 505.1a8.74 8.74 0 0 0 0 13.8z"/>
  109. </svg>
  110. </symbol>
  111. <symbol id="svg-menu" viewBox="0 0 24 24">
  112. <title>Menu</title>
  113. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor"
  114. stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="feather-menu">
  115. <line x1="3" y1="12" x2="21" y2="12"></line>
  116. <line x1="3" y1="6" x2="21" y2="6"></line>
  117. <line x1="3" y1="18" x2="21" y2="18"></line>
  118. </svg>
  119. </symbol>
  120. <symbol id="svg-arrow-right" viewBox="0 0 24 24">
  121. <title>Expand</title>
  122. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor"
  123. stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="feather-chevron-right">
  124. <polyline points="9 18 15 12 9 6"></polyline>
  125. </svg>
  126. </symbol>
  127. <symbol id="svg-sun" viewBox="0 0 24 24">
  128. <title>Light mode</title>
  129. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor"
  130. stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" class="feather-sun">
  131. <circle cx="12" cy="12" r="5"></circle>
  132. <line x1="12" y1="1" x2="12" y2="3"></line>
  133. <line x1="12" y1="21" x2="12" y2="23"></line>
  134. <line x1="4.22" y1="4.22" x2="5.64" y2="5.64"></line>
  135. <line x1="18.36" y1="18.36" x2="19.78" y2="19.78"></line>
  136. <line x1="1" y1="12" x2="3" y2="12"></line>
  137. <line x1="21" y1="12" x2="23" y2="12"></line>
  138. <line x1="4.22" y1="19.78" x2="5.64" y2="18.36"></line>
  139. <line x1="18.36" y1="5.64" x2="19.78" y2="4.22"></line>
  140. </svg>
  141. </symbol>
  142. <symbol id="svg-moon" viewBox="0 0 24 24">
  143. <title>Dark mode</title>
  144. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor"
  145. stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" class="icon-tabler-moon">
  146. <path stroke="none" d="M0 0h24v24H0z" fill="none" />
  147. <path d="M12 3c.132 0 .263 0 .393 0a7.5 7.5 0 0 0 7.92 12.446a9 9 0 1 1 -8.313 -12.454z" />
  148. </svg>
  149. </symbol>
  150. <symbol id="svg-sun-half" viewBox="0 0 24 24">
  151. <title>Auto light/dark mode</title>
  152. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor"
  153. stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" class="icon-tabler-shadow">
  154. <path stroke="none" d="M0 0h24v24H0z" fill="none"/>
  155. <circle cx="12" cy="12" r="9" />
  156. <path d="M13 12h5" />
  157. <path d="M13 15h4" />
  158. <path d="M13 18h1" />
  159. <path d="M13 9h4" />
  160. <path d="M13 6h1" />
  161. </svg>
  162. </symbol>
  163. </svg>
  164. <input type="checkbox" class="sidebar-toggle" name="__navigation" id="__navigation">
  165. <input type="checkbox" class="sidebar-toggle" name="__toc" id="__toc">
  166. <label class="overlay sidebar-overlay" for="__navigation">
  167. <div class="visually-hidden">Hide navigation sidebar</div>
  168. </label>
  169. <label class="overlay toc-overlay" for="__toc">
  170. <div class="visually-hidden">Hide table of contents sidebar</div>
  171. </label>
  172. <div class="page">
  173. <!--<header class="mobile-header">
  174. <div class="header-left">
  175. <label class="nav-overlay-icon" for="__navigation">
  176. <div class="visually-hidden">Toggle site navigation sidebar</div>
  177. <i class="icon"><svg><use href="#svg-menu"></use></svg></i>
  178. </label>
  179. </div>
  180. <div class="header-center">
  181. <a href="../../"><div class="brand">MiniGrid Documentation</div></a>
  182. </div>
  183. <div class="header-right">
  184. <div class="theme-toggle-container theme-toggle-header">
  185. <button class="theme-toggle">
  186. <div class="visually-hidden">Toggle Light / Dark / Auto color theme</div>
  187. <svg class="theme-icon-when-auto"><use href="#svg-sun-half"></use></svg>
  188. <svg class="theme-icon-when-dark"><use href="#svg-moon"></use></svg>
  189. <svg class="theme-icon-when-light"><use href="#svg-sun"></use></svg>
  190. </button>
  191. </div>
  192. <label class="toc-overlay-icon toc-header-icon no-toc" for="__toc">
  193. <div class="visually-hidden">Toggle table of contents sidebar</div>
  194. <i class="icon"><svg><use href="#svg-toc"></use></svg></i>
  195. </label>
  196. </div>
  197. </header>-->
  198. <aside class="sidebar-drawer">
  199. <div class="sidebar-container">
  200. <div class="sidebar-sticky"><a class="farama-sidebar__title" href="../../">
  201. <img class="farama-header__logo only-light" src="../../_static/img/minigrid.svg" alt="Light Logo"/>
  202. <img class="farama-header__logo only-dark" src="../../_static/img/minigrid-white.svg" alt="Dark Logo"/>
  203. <span class="farama-header__title">MiniGrid Documentation</span>
  204. </a><form class="sidebar-search-container" method="get" action="../../search/" role="search">
  205. <input class="sidebar-search" placeholder=Search name="q" aria-label="Search">
  206. <input type="hidden" name="check_keywords" value="yes">
  207. <input type="hidden" name="area" value="default">
  208. </form>
  209. <div id="searchbox"></div><div class="sidebar-scroll"><div class="sidebar-tree">
  210. <p class="caption" role="heading"><span class="caption-text">Introduction</span></p>
  211. <ul class="current">
  212. <li class="toctree-l1 current current-page"><a class="current reference internal" href="#">Basic Usage</a></li>
  213. <li class="toctree-l1"><a class="reference internal" href="#training-an-agent">Training an Agent</a></li>
  214. <li class="toctree-l1"><a class="reference internal" href="../publications/">List of Publications</a></li>
  215. </ul>
  216. <p class="caption" role="heading"><span class="caption-text">Wrappers</span></p>
  217. <ul>
  218. <li class="toctree-l1 has-children"><a class="reference internal" href="../../api/wrapper/">Wrapper</a><input class="toctree-checkbox" id="toctree-checkbox-1" name="toctree-checkbox-1" role="switch" type="checkbox"/><label for="toctree-checkbox-1"><div class="visually-hidden">Toggle child pages in navigation</div><i class="icon"><svg><use href="#svg-arrow-right"></use></svg></i></label><ul>
  219. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/">Action Bonus</a></li>
  220. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/#dict-observation-space">Dict Observation Space</a></li>
  221. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/#direction-obs">Direction Obs</a></li>
  222. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/#flatobs">FlatObs</a></li>
  223. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/#fully-obs">Fully Obs</a></li>
  224. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/#observation">Observation</a></li>
  225. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/#one-hot-partial-obs">One Hot Partial Obs</a></li>
  226. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/#reseed">Reseed</a></li>
  227. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/#rgb-img-obs">RGB Img Obs</a></li>
  228. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/#position-bonus">Position Bonus</a></li>
  229. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/#symbolic-obs">Symbolic Obs</a></li>
  230. <li class="toctree-l2"><a class="reference internal" href="../../api/wrappers/#view-size">View Size</a></li>
  231. </ul>
  232. </li>
  233. </ul>
  234. <p class="caption" role="heading"><span class="caption-text">Environments</span></p>
  235. <ul>
  236. <li class="toctree-l1 has-children"><a class="reference internal" href="../../environments/minigrid/">Minigrid Environments</a><input class="toctree-checkbox" id="toctree-checkbox-2" name="toctree-checkbox-2" role="switch" type="checkbox"/><label for="toctree-checkbox-2"><div class="visually-hidden">Toggle child pages in navigation</div><i class="icon"><svg><use href="#svg-arrow-right"></use></svg></i></label><ul>
  237. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/BlockedUnlockPickupEnv/">Blocked Unlock Pickup</a></li>
  238. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/CrossingEnv/">Crossing</a></li>
  239. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/DistShiftEnv/">Dist Shift</a></li>
  240. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/DoorKeyEnv/">Door Key</a></li>
  241. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/DynamicObstaclesEnv/">Dynamic Obstacles</a></li>
  242. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/EmptyEnv/">Empty</a></li>
  243. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/FetchEnv/">Fetch</a></li>
  244. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/FourRoomsEnv/">Four Rooms</a></li>
  245. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/GoToDoorEnv/">Go To Door</a></li>
  246. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/GoToObjectEnv/">Go To Object</a></li>
  247. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/KeyCorridorEnv/">Key Corridor</a></li>
  248. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/LavaGapEnv/">Lava Gap</a></li>
  249. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/LockedRoomEnv/">Locked Room</a></li>
  250. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/MemoryEnv/">Memory</a></li>
  251. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/MultiRoomEnv/">Multi Room</a></li>
  252. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/ObstructedMaze_1Dlhb/">Obstructed Maze Dlhb</a></li>
  253. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/ObstructedMaze_Full/">Obstructed Maze Full</a></li>
  254. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/PlaygroundEnv/">Playground</a></li>
  255. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/PutNearEnv/">Put Near</a></li>
  256. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/RedBlueDoorEnv/">Red Blue Door</a></li>
  257. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/UnlockEnv/">Unlock</a></li>
  258. <li class="toctree-l2"><a class="reference internal" href="../../environments/minigrid/UnlockPickupEnv/">Unlock Pickup</a></li>
  259. </ul>
  260. </li>
  261. <li class="toctree-l1 has-children"><a class="reference internal" href="../../environments/babyai/">BabyAI Environments</a><input class="toctree-checkbox" id="toctree-checkbox-3" name="toctree-checkbox-3" role="switch" type="checkbox"/><label for="toctree-checkbox-3"><div class="visually-hidden">Toggle child pages in navigation</div><i class="icon"><svg><use href="#svg-arrow-right"></use></svg></i></label><ul>
  262. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/GoToRedBallGrey/">Go To Red Ball Grey</a></li>
  263. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/GoToRedBall/">Go To Red Ball</a></li>
  264. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/GoToRedBallNoDists/">Go To Red Ball No Dists</a></li>
  265. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/GoToObj/">Go To Obj</a></li>
  266. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/GoToLocal/">Go To Local</a></li>
  267. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/GoTo/">Go To</a></li>
  268. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/GoToImpUnlock/">Go To Imp Unlock</a></li>
  269. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/GoToSeq/">Go To Seq</a></li>
  270. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/GoToRedBlueBall/">Go To Red Blue Ball</a></li>
  271. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/GoToDoor/">Go To Door</a></li>
  272. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/GoToObjDoor/">Go To Obj Door</a></li>
  273. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/Open/">Open</a></li>
  274. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/OpenRedDoor/">Open Red Door</a></li>
  275. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/OpenDoor/">Open Door</a></li>
  276. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/OpenTwoDoors/">Open Two Doors</a></li>
  277. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/OpenDoorsOrder/">Open Doors Order</a></li>
  278. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/Pickup/">Pickup</a></li>
  279. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/UnblockPickup/">Unblock Pickup</a></li>
  280. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/PickupLoc/">Pickup Loc</a></li>
  281. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/PickupDist/">Pickup Dist</a></li>
  282. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/PickupAbove/">Pickup Above</a></li>
  283. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/PutNextLocal/">Put Next Local</a></li>
  284. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/PutNext/">Put Next</a></li>
  285. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/Unlock/">Unlock</a></li>
  286. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/UnlockLocal/">Unlock Local</a></li>
  287. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/KeyInBox/">Key In Box</a></li>
  288. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/UnlockPickup/">Unlock Pickup</a></li>
  289. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/BlockedUnlockPickup/">Blocked Unlock Pickup</a></li>
  290. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/UnlockToUnlock/">Unlock To Unlock</a></li>
  291. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/ActionObjDoor/">Action Obj Door</a></li>
  292. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/FindObjS5/">Find Obj</a></li>
  293. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/KeyCorridor/">Key Corridor</a></li>
  294. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/OneRoomS8/">One Room</a></li>
  295. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/MoveTwoAcross/">Move Two Across</a></li>
  296. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/Synth/">Synth</a></li>
  297. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/SynthLoc/">Synth Loc</a></li>
  298. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/SynthSeq/">Synth Seq</a></li>
  299. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/MiniBossLevel/">Mini Boss Level</a></li>
  300. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/BossLevel/">Boss Level</a></li>
  301. <li class="toctree-l2"><a class="reference internal" href="../../environments/babyai/BossLevelNoUnlock/">Boss Level No Unlock</a></li>
  302. </ul>
  303. </li>
  304. </ul>
  305. <p class="caption" role="heading"><span class="caption-text">Development</span></p>
  306. <ul>
  307. <li class="toctree-l1"><a class="reference external" href="https://github.com/Farama-Foundation/MiniGrid">Github</a></li>
  308. </ul>
  309. </div>
  310. </div>
  311. </div>
  312. </div>
  313. </aside>
  314. <div class="main-container">
  315. <div class="main">
  316. <div class="content">
  317. <div class="article-container">
  318. <a href="#" class="back-to-top muted-link">
  319. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24">
  320. <path d="M13 20h-2V8l-5.5 5.5-1.42-1.42L12 4.16l7.92 7.92-1.42 1.42L13 8v12z"></path>
  321. </svg>
  322. <span>Back to top</span>
  323. </a>
  324. <div class="content-icon-container">
  325. <div class="edit-this-page">
  326. <a class="muted-link" href="https://github.com/Farama-Foundation/Minigrid/edit/master/docs/content/basic_usage.md" title="Edit this page">
  327. <svg aria-hidden="true" viewBox="0 0 24 24" stroke-width="1.5" stroke="currentColor" fill="none" stroke-linecap="round" stroke-linejoin="round">
  328. <path stroke="none" d="M0 0h24v24H0z" fill="none"/>
  329. <path d="M4 20h4l10.5 -10.5a1.5 1.5 0 0 0 -4 -4l-10.5 10.5v4" />
  330. <line x1="13.5" y1="6.5" x2="17.5" y2="10.5" />
  331. </svg>
  332. <span class="visually-hidden">Edit this page</span>
  333. </a>
  334. </div><div class="theme-toggle-container theme-toggle-content">
  335. <button class="theme-toggle">
  336. <div class="visually-hidden">Toggle Light / Dark / Auto color theme</div>
  337. <svg class="theme-icon-when-auto">
  338. <use href="#svg-sun-half"></use>
  339. </svg>
  340. <svg class="theme-icon-when-dark">
  341. <use href="#svg-moon"></use>
  342. </svg>
  343. <svg class="theme-icon-when-light">
  344. <use href="#svg-sun"></use>
  345. </svg>
  346. </button>
  347. </div>
  348. <label class="toc-overlay-icon toc-content-icon no-toc" for="__toc">
  349. <div class="visually-hidden">Toggle table of contents sidebar</div>
  350. <i class="icon"><svg>
  351. <use href="#svg-toc"></use>
  352. </svg></i>
  353. </label>
  354. </div>
  355. <article role="main">
  356. <section id="basic-usage">
  357. <h1>Basic Usage<a class="headerlink" href="#basic-usage" title="Permalink to this heading">#</a></h1>
  358. <p>There is a UI application which allows you to manually control the agent with the arrow keys:</p>
  359. <div class="highlight-default notranslate"><div class="highlight"><pre><span></span><span class="o">./</span><span class="n">minigrid</span><span class="o">/</span><span class="n">manual_control</span><span class="o">.</span><span class="n">py</span>
  360. </pre></div>
  361. </div>
  362. <p>The environment being run can be selected with the <code class="docutils literal notranslate"><span class="pre">--env</span></code> option, e.g.:</p>
  363. <div class="highlight-default notranslate"><div class="highlight"><pre><span></span><span class="o">./</span><span class="n">minigrid</span><span class="o">/</span><span class="n">manual_control</span><span class="o">.</span><span class="n">py</span> <span class="o">--</span><span class="n">env</span> <span class="n">MiniGrid</span><span class="o">-</span><span class="n">Empty</span><span class="o">-</span><span class="mi">8</span><span class="n">x8</span><span class="o">-</span><span class="n">v0</span>
  364. </pre></div>
  365. </div>
  366. </section>
  367. <section id="training-an-agent">
  368. <h1>Training an Agent<a class="headerlink" href="#training-an-agent" title="Permalink to this heading">#</a></h1>
  369. <p>If you want to train an agent with reinforcement learning, I recommend using the code found in the <a class="reference external" href="https://github.com/lcswillems/torch-rl">torch-rl</a> repository.
  370. This code has been tested and is known to work with this environment. The default hyper-parameters are also known to converge.</p>
  371. <p>A sample training command is:</p>
  372. <div class="highlight-default notranslate"><div class="highlight"><pre><span></span><span class="n">cd</span> <span class="n">torch</span><span class="o">-</span><span class="n">rl</span>
  373. <span class="n">python3</span> <span class="o">-</span><span class="n">m</span> <span class="n">scripts</span><span class="o">.</span><span class="n">train</span> <span class="o">--</span><span class="n">env</span> <span class="n">MiniGrid</span><span class="o">-</span><span class="n">Empty</span><span class="o">-</span><span class="mi">8</span><span class="n">x8</span><span class="o">-</span><span class="n">v0</span> <span class="o">--</span><span class="n">algo</span> <span class="n">ppo</span>
  374. </pre></div>
  375. </div>
  376. </section>
  377. </article>
  378. </div>
  379. <footer>
  380. <div class="related-pages">
  381. <a class="next-page" href="../publications/">
  382. <div class="page-info">
  383. <div class="context">
  384. <span>Next</span>
  385. </div>
  386. <div class="title">List of Publications</div>
  387. </div>
  388. <svg class="furo-related-icon">
  389. <use href="#svg-arrow-right"></use>
  390. </svg>
  391. </a>
  392. </div>
  393. <div class="bottom-of-page">
  394. <div class="left-details">
  395. <div class="copyright">
  396. Copyright &#169; 2022
  397. </div>
  398. <!--
  399. Made with <a href="https://www.sphinx-doc.org/">Sphinx</a> and <a class="muted-link" href="https://pradyunsg.me">@pradyunsg</a>'s
  400. <a href="https://github.com/pradyunsg/furo">Furo</a>
  401. -->
  402. </div>
  403. <div class="right-details">
  404. <div class="icons">
  405. <a class="muted-link" href="https://github.com/Farama-Foundation/Minigrid"
  406. aria-label="On GitHub">
  407. <svg stroke="currentColor" fill="currentColor" stroke-width="0" viewBox="0 0 16 16">
  408. <path fill-rule="evenodd"
  409. d="M8 0C3.58 0 0 3.58 0 8c0 3.54 2.29 6.53 5.47 7.59.4.07.55-.17.55-.38 0-.19-.01-.82-.01-1.49-2.01.37-2.53-.49-2.69-.94-.09-.23-.48-.94-.82-1.13-.28-.15-.68-.52-.01-.53.63-.01 1.08.58 1.23.82.72 1.21 1.87.87 2.33.66.07-.52.28-.87.51-1.07-1.78-.2-3.64-.89-3.64-3.95 0-.87.31-1.59.82-2.15-.08-.2-.36-1.02.08-2.12 0 0 .67-.21 2.2.82.64-.18 1.32-.27 2-.27.68 0 1.36.09 2 .27 1.53-1.04 2.2-.82 2.2-.82.44 1.1.16 1.92.08 2.12.51.56.82 1.27.82 2.15 0 3.07-1.87 3.75-3.65 3.95.29.25.54.73.54 1.48 0 1.07-.01 1.93-.01 2.2 0 .21.15.46.55.38A8.013 8.013 0 0 0 16 8c0-4.42-3.58-8-8-8z">
  410. </path>
  411. </svg>
  412. </a>
  413. </div>
  414. </div>
  415. </div>
  416. </footer>
  417. </div>
  418. <aside class="toc-drawer no-toc">
  419. </aside>
  420. </div>
  421. </div>
  422. </div>
  423. <script>
  /**
   * Open or close the Farama header menu.
   *
   * The menu counts as open while the `.farama-header-menu` wrapper carries the
   * `active` class. Each call flips that class and sets `aria-expanded` on the
   * trigger button and `aria-hidden` on the menu panel to match the new state.
   */
  const toggleMenu = () => {
    const trigger = document.querySelector(".farama-header-menu__btn");
    const panel = document.querySelector(".farama-header-menu-container");
    const menu = document.querySelector(".farama-header-menu");

    // Decide the target state before touching any attribute.
    const willOpen = !menu.classList.contains("active");

    trigger.setAttribute("aria-expanded", String(willOpen));
    panel.setAttribute("aria-hidden", String(!willOpen));
    menu.classList.toggle("active");
  };
  // Both the header menu button and the in-menu close button drive the same
  // toggle handler.
  for (const trigger of [
    document.querySelector(".farama-header-menu__btn"),
    document.getElementById("farama-close-menu"),
  ]) {
    trigger.addEventListener("click", toggleMenu);
  }
  438. </script>
  439. <script>
  /**
   * One-time analytics notice.
   *
   * Unless the `shownCookieAlert` flag is already present in localStorage,
   * builds a `.cookie-alert` box (text + close button) and appends it to
   * <body>. Clicking the close button stores the flag and hides the box.
   *
   * Storage access is wrapped in try/catch: browsers may throw when storage is
   * blocked by user policy. In that case the notice is still shown and can
   * still be dismissed for the current page view.
   */
  (() => {
    const storageKey = "shownCookieAlert";

    let alreadyShown = false;
    try {
      alreadyShown = Boolean(localStorage.getItem(storageKey));
    } catch (err) {
      // Treat unreadable storage as "not shown yet" so the notice still appears.
      console.warn("Unable to read cookie alert state", err);
    }
    if (alreadyShown) {
      return;
    }

    const boxElem = document.createElement("div");
    boxElem.classList.add("cookie-alert");

    const containerElem = document.createElement("div");
    containerElem.classList.add("cookie-alert__container");

    // Static, author-controlled markup: innerHTML is safe here.
    const textElem = document.createElement("p");
    textElem.innerHTML = `This page uses <a href="https://analytics.google.com/">
Google Analytics</a> to collect statistics. You can disable it by blocking
the JavaScript coming from www.google-analytics.com.`;
    containerElem.appendChild(textElem);

    const closeBtn = document.createElement("button");
    // The button contains only an icon (its <title/> is empty), so give it an
    // accessible name for assistive technology.
    closeBtn.setAttribute("aria-label", "Close");
    closeBtn.innerHTML = `<?xml version="1.0" ?><svg viewBox="0 0 32 32" xmlns="http://www.w3.org/2000/svg"><defs><style>.cls-1{fill:none;stroke:#000;stroke-linecap:round;stroke-linejoin:round;stroke-width:2px;}</style></defs><title/><g id="cross"><line class="cls-1" x1="7" x2="25" y1="7" y2="25"/><line class="cls-1" x1="7" x2="25" y1="25" y2="7"/></g></svg>`;
    closeBtn.onclick = () => {
      try {
        localStorage.setItem(storageKey, "true");
      } catch (err) {
        // Persisting the dismissal is best-effort; still hide the box below.
        console.warn("Unable to persist cookie alert state", err);
      }
      boxElem.style.display = "none";
    };
    containerElem.appendChild(closeBtn);

    boxElem.appendChild(containerElem);
    document.body.appendChild(boxElem);
  })();
  462. </script>
  463. <script async src="https://www.googletagmanager.com/gtag/js?id=G-FBXJQQLXKD"></script>
  464. <script>
  // Google tag bootstrap: make sure the shared queue exists, then enqueue the
  // initial 'js' and 'config' commands for the measurement ID.
  window.dataLayer = window.dataLayer || [];

  function gtag() {
    // Pushes the `arguments` object itself (not a copied array), exactly as the
    // original snippet does. NOTE(review): presumably the tag library relies on
    // this shape; do not convert to rest parameters without confirming.
    dataLayer.push(arguments);
  }

  gtag('js', new Date());
  gtag('config', 'G-FBXJQQLXKD');
  469. </script>
  470. <script data-url_root="../../" id="documentation_options" src="../../_static/documentation_options.js"></script>
  471. <script src="../../_static/jquery.js"></script>
  472. <script src="../../_static/underscore.js"></script>
  473. <script src="../../_static/_sphinx_javascript_frameworks_compat.js"></script>
  474. <script src="../../_static/doctools.js"></script>
  475. <script src="../../_static/sphinx_highlight.js"></script>
  476. <script src="../../_static/scripts/furo.js"></script>
  477. <script>
  /**
   * Create and open (but do not send) a cross-origin request.
   *
   * @param {string} method - HTTP method passed to `open`.
   * @param {string} url - Target URL passed to `open`.
   * @returns {?object} An opened XMLHttpRequest (asynchronous, with
   *   `responseType` set to 'json') when the XHR object exposes
   *   `withCredentials`; otherwise an opened XDomainRequest when that
   *   constructor exists; otherwise `null`.
   */
  const createCORSRequest = (method, url) => {
    const request = new XMLHttpRequest();
    request.responseType = 'json';

    if ("withCredentials" in request) {
      request.open(method, url, true);
      return request;
    }

    // CORS not supported.
    if (typeof XDomainRequest === "undefined") {
      return null;
    }

    // IE8 & IE9
    const legacyRequest = new XDomainRequest();
    legacyRequest.open(method, url);
    return legacyRequest;
  };
  // Where the project list and the project logos are served from.
  const method = 'GET';
  const url = 'https://farama.org/api/projects.json';
  const imagesBasepath = "https://farama.org/assets/images";

  // Opened but not yet sent; the handlers are attached before send() is called.
  let xhr = createCORSRequest(method, url);
  /**
   * Populate the Farama header menu once the project list has loaded.
   *
   * Reads the parsed JSON from `xhr.response`, sorts each project into a menu
   * section, and appends one section element (title + list of links) per
   * section to `.farama-header-menu__body`:
   *   - projects with a `website` go to "Documentation" and link to it;
   *   - other projects whose `type` is "mature" go to "Mature Projects";
   *   - everything else goes to "Incubating Projects";
   *   the latter two link to the project's `github` value.
   * The "Foundation" section is a fixed list of links without logos.
   */
  xhr.onload = () => {
    const jsonResponse = xhr.response;

    // With responseType 'json' the response is null when the body could not be
    // parsed (e.g. an HTML error page). Bail out instead of throwing below.
    if (!jsonResponse || typeof jsonResponse !== "object") {
      console.error("Unable to load projects");
      return;
    }

    const sections = {
      "Documentation": [],
      "Mature Projects": [],
      "Incubating Projects": [],
      "Foundation": [
        {
          name: "About",
          link: "https://farama.org/about"
        },
        {
          name: "Standards",
          link: "https://farama.org/project_standards",
        },
        {
          name: "Donate",
          link: "https://farama.org/donations"
        }
      ]
    };

    Object.keys(jsonResponse).forEach((key) => {
      // Declared locally: previously this leaked as an implicit global.
      const projectJson = jsonResponse[key];
      // `!= null` treats a missing `website` field like an explicit null.
      if (projectJson.website != null) {
        projectJson.link = projectJson.website;
        sections["Documentation"].push(projectJson);
      } else if (projectJson.type === "mature") {
        projectJson.link = projectJson.github;
        sections["Mature Projects"].push(projectJson);
      } else {
        projectJson.link = projectJson.github;
        sections["Incubating Projects"].push(projectJson);
      }
    });

    const menuContainer = document.querySelector(".farama-header-menu__body");

    Object.keys(sections).forEach((key) => {
      // Declared locally: previously this leaked as an implicit global.
      const projects = sections[key];

      const sectionElem = Object.assign(document.createElement('div'), {
        className: 'farama-header-menu__section',
        style: "padding-left: 24px"
      });
      sectionElem.appendChild(Object.assign(document.createElement('span'), {
        className: 'farama-header-menu__section-title',
        innerText: key
      }));

      const ulElem = Object.assign(document.createElement('ul'), {
        className: 'farama-header-menu-list',
      });

      for (const project of projects) {
        const liElem = document.createElement("li");
        const aElem = Object.assign(document.createElement("a"), {
          href: project.link
        });
        liElem.appendChild(aElem);

        // Foundation links are text-only; every project link gets a logo,
        // falling back to the generic Farama logo when none is provided.
        if (key !== "Foundation") {
          const imgElem = Object.assign(document.createElement("img"), {
            src: `${imagesBasepath}${project.image || "/farama_black.svg"}`,
            alt: `${project.name} logo`,
            className: "farama-black-logo-invert"
          });
          aElem.appendChild(imgElem);
        }

        // Text node (not innerHTML) so the remote name is never parsed as markup.
        aElem.appendChild(document.createTextNode(project.name));
        ulElem.appendChild(liElem);
      }

      sectionElem.appendChild(ulElem);
      menuContainer.appendChild(sectionElem);
    });
  };
  // If the request itself errors, log it; the menu simply stays unpopulated.
  xhr.onerror = () => {
    console.error("Unable to load projects");
  };

  // Handlers are in place; fire the request.
  xhr.send();
  580. </script>
  581. </body>
  582. </html>