index.html 137 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596
  1. <!doctype html>
  2. <html class="no-js" lang="en" data-content_root="../../../">
  3. <head><meta charset="utf-8"/>
  4. <meta name="viewport" content="width=device-width,initial-scale=1"/>
  5. <meta name="color-scheme" content="light dark">
  6. <meta name="description" content="Minigrid contains simple and easily configurable grid world environments to conduct Reinforcement Learning research. This library was previously known as gym-minigrid.">
  7. <meta property="og:title" content="MiniGrid Documentation" />
  8. <meta property="og:type" content="website" />
  9. <meta property="og:description" content="Minigrid contains simple and easily configurable grid world environments to conduct Reinforcement Learning research. This library was previously known as gym-minigrid." />
  10. <meta property="og:url" content="https://minigrid.farama.org/_modules/minigrid/wrappers.html" /><meta property="og:image" content="https://minigrid.farama.org//_static/img/minigrid-github.png" /><meta name="twitter:card" content="summary_large_image"><link rel="index" title="Index" href="../../../genindex/" /><link rel="search" title="Search" href="../../../search/" />
  11. <link rel="canonical" href="https://minigrid.farama.org/_modules/minigrid/wrappers.html" />
  12. <link rel="shortcut icon" href="../../../_static/minigrid-favicon.png"/><!-- Generated with Sphinx 7.2.6 and Furo 2023.08.19.dev1 -->
  13. <title>minigrid.wrappers - MiniGrid Documentation</title>
  14. <link rel="stylesheet" type="text/css" href="../../../_static/pygments.css?v=a746c00c" />
  15. <link rel="stylesheet" type="text/css" href="../../../_static/styles/furo.css?v=3e7f4c72" />
  16. <link rel="stylesheet" type="text/css" href="../../../_static/styles/furo-extensions.css?v=49cbaffd" />
  17. <style>
  18. body {
  19. --color-code-background: #f8f8f8;
  20. --color-code-foreground: black;
  21. }
  22. @media not print {
  23. body[data-theme="dark"] {
  24. --color-code-background: #202020;
  25. --color-code-foreground: #d0d0d0;
  26. }
  27. @media (prefers-color-scheme: dark) {
  28. body:not([data-theme="light"]) {
  29. --color-code-background: #202020;
  30. --color-code-foreground: #d0d0d0;
  31. }
  32. }
  33. }
  34. </style></head>
  35. <body>
  36. <header class="farama-header" aria-label="Farama header">
  37. <div class="farama-header__container">
  38. <div class="farama-header__left--mobile">
  39. <label class="nav-overlay-icon" for="__navigation">
  40. <div class="visually-hidden">Toggle site navigation sidebar</div>
  41. <svg viewBox="0 0 24 24" xmlns="http://www.w3.org/2000/svg">
  42. <defs></defs>
  43. <line x1="0.5" y1="4" x2="23.5" y2="4"></line>
  44. <line x1="0.232" y1="12" x2="23.5" y2="12"></line>
  45. <line x1="0.232" y1="20" x2="23.5" y2="20"></line>
  46. </svg>
  47. </label>
  48. </div>
  49. <div class="farama-header__left farama-header__center--mobile">
  50. <a href="../../../">
  51. <img class="farama-header__logo only-light" src="../../../_static/img/minigrid.svg" alt="Light Logo"/>
  52. <img class="farama-header__logo only-dark" src="../../../_static/img/minigrid-white.svg" alt="Dark Logo"/>
  53. <span class="farama-header__title">MiniGrid Documentation</span>
  54. </a>
  55. </div>
  56. <div class="farama-header__right">
  57. <div class="farama-header-menu">
  58. <button class="farama-header-menu__btn" aria-label="Open Farama Menu" aria-expanded="false" aria-haspopup="true" aria-controls="farama-menu">
  59. <img class="farama-black-logo-invert" src="../../../_static/img/farama-logo-header.svg">
  60. <svg viewBox="0 0 24 24" viewBox="0 0 24 24" xmlns="http://www.w3.org/2000/svg">
  61. <polyline style="stroke-linecap: round; stroke-linejoin: round; fill: none; stroke-width: 2px;" points="1 7 12 18 23 7"></polyline>
  62. </svg>
  63. </button>
  64. <div class="farama-header-menu-container farama-hidden" aria-hidden="true" id="farama-menu">
  65. <div class="farama-header-menu__header">
  66. <a href="https://farama.org">
  67. <img class="farama-header-menu__logo farama-white-logo-invert" src="../../../_static/img/farama_solid_white.svg" alt="Farama Foundation logo">
  68. <span>Farama Foundation</span>
  69. </a>
  70. <div class="farama-header-menu-header__right">
  71. <button id="farama-close-menu">
  72. <svg viewBox="0 0 24 24" xmlns="http://www.w3.org/2000/svg" fill="none" stroke="currentColor"
  73. stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="icon-close">
  74. <line x1="3" y1="21" x2="21" y2="3"></line>
  75. <line x1="3" y1="3" x2="21" y2="21"></line>
  76. </svg>
  77. </button>
  78. </div>
  79. </div>
  80. <div class="farama-header-menu__body">
  81. <!-- Response from farama.org/api/projects.json -->
  82. </div>
  83. </div>
  84. </div>
  85. </div>
  86. </div>
  87. </header>
  88. <script>
  89. document.body.dataset.theme = localStorage.getItem("theme") || "auto";
  90. </script>
  91. <svg xmlns="http://www.w3.org/2000/svg" style="display: none;">
  92. <symbol id="svg-toc" viewBox="0 0 24 24">
  93. <title>Contents</title>
  94. <svg stroke="currentColor" fill="currentColor" stroke-width="0" viewBox="0 0 1024 1024">
  95. <path d="M408 442h480c4.4 0 8-3.6 8-8v-56c0-4.4-3.6-8-8-8H408c-4.4 0-8 3.6-8 8v56c0 4.4 3.6 8 8 8zm-8 204c0 4.4 3.6 8 8 8h480c4.4 0 8-3.6 8-8v-56c0-4.4-3.6-8-8-8H408c-4.4 0-8 3.6-8 8v56zm504-486H120c-4.4 0-8 3.6-8 8v56c0 4.4 3.6 8 8 8h784c4.4 0 8-3.6 8-8v-56c0-4.4-3.6-8-8-8zm0 632H120c-4.4 0-8 3.6-8 8v56c0 4.4 3.6 8 8 8h784c4.4 0 8-3.6 8-8v-56c0-4.4-3.6-8-8-8zM115.4 518.9L271.7 642c5.8 4.6 14.4.5 14.4-6.9V388.9c0-7.4-8.5-11.5-14.4-6.9L115.4 505.1a8.74 8.74 0 0 0 0 13.8z"/>
  96. </svg>
  97. </symbol>
  98. <symbol id="svg-menu" viewBox="0 0 24 24">
  99. <title>Menu</title>
  100. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor"
  101. stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="feather-menu">
  102. <line x1="3" y1="12" x2="21" y2="12"></line>
  103. <line x1="3" y1="6" x2="21" y2="6"></line>
  104. <line x1="3" y1="18" x2="21" y2="18"></line>
  105. </svg>
  106. </symbol>
  107. <symbol id="svg-arrow-right" viewBox="0 0 24 24">
  108. <title>Expand</title>
  109. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor"
  110. stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="feather-chevron-right">
  111. <polyline points="9 18 15 12 9 6"></polyline>
  112. </svg>
  113. </symbol>
  114. <symbol id="svg-sun" viewBox="0 0 24 24">
  115. <title>Light mode</title>
  116. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor"
  117. stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" class="feather-sun">
  118. <circle cx="12" cy="12" r="5"></circle>
  119. <line x1="12" y1="1" x2="12" y2="3"></line>
  120. <line x1="12" y1="21" x2="12" y2="23"></line>
  121. <line x1="4.22" y1="4.22" x2="5.64" y2="5.64"></line>
  122. <line x1="18.36" y1="18.36" x2="19.78" y2="19.78"></line>
  123. <line x1="1" y1="12" x2="3" y2="12"></line>
  124. <line x1="21" y1="12" x2="23" y2="12"></line>
  125. <line x1="4.22" y1="19.78" x2="5.64" y2="18.36"></line>
  126. <line x1="18.36" y1="5.64" x2="19.78" y2="4.22"></line>
  127. </svg>
  128. </symbol>
  129. <symbol id="svg-moon" viewBox="0 0 24 24">
  130. <title>Dark mode</title>
  131. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor"
  132. stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" class="icon-tabler-moon">
  133. <path stroke="none" d="M0 0h24v24H0z" fill="none" />
  134. <path d="M12 3c.132 0 .263 0 .393 0a7.5 7.5 0 0 0 7.92 12.446a9 9 0 1 1 -8.313 -12.454z" />
  135. </svg>
  136. </symbol>
  137. <symbol id="svg-sun-half" viewBox="0 0 24 24">
  138. <title>Auto light/dark mode</title>
  139. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor"
  140. stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" class="icon-tabler-shadow">
  141. <path stroke="none" d="M0 0h24v24H0z" fill="none"/>
  142. <circle cx="12" cy="12" r="9" />
  143. <path d="M13 12h5" />
  144. <path d="M13 15h4" />
  145. <path d="M13 18h1" />
  146. <path d="M13 9h4" />
  147. <path d="M13 6h1" />
  148. </svg>
  149. </symbol>
  150. </svg>
  151. <input type="checkbox" class="sidebar-toggle" name="__navigation" id="__navigation">
  152. <input type="checkbox" class="sidebar-toggle" name="__toc" id="__toc">
  153. <label class="overlay sidebar-overlay" for="__navigation">
  154. <div class="visually-hidden">Hide navigation sidebar</div>
  155. </label>
  156. <label class="overlay toc-overlay" for="__toc">
  157. <div class="visually-hidden">Hide table of contents sidebar</div>
  158. </label>
  159. <div class="page">
  160. <!--<header class="mobile-header">
  161. <div class="header-left">
  162. <label class="nav-overlay-icon" for="__navigation">
  163. <div class="visually-hidden">Toggle site navigation sidebar</div>
  164. <i class="icon"><svg><use href="#svg-menu"></use></svg></i>
  165. </label>
  166. </div>
  167. <div class="header-center">
  168. <a href="../../../"><div class="brand">MiniGrid Documentation</div></a>
  169. </div>
  170. <div class="header-right">
  171. <div class="theme-toggle-container theme-toggle-header">
  172. <button class="theme-toggle">
  173. <div class="visually-hidden">Toggle Light / Dark / Auto color theme</div>
  174. <svg class="theme-icon-when-auto"><use href="#svg-sun-half"></use></svg>
  175. <svg class="theme-icon-when-dark"><use href="#svg-moon"></use></svg>
  176. <svg class="theme-icon-when-light"><use href="#svg-sun"></use></svg>
  177. </button>
  178. </div>
  179. <label class="toc-overlay-icon toc-header-icon no-toc" for="__toc">
  180. <div class="visually-hidden">Toggle table of contents sidebar</div>
  181. <i class="icon"><svg><use href="#svg-toc"></use></svg></i>
  182. </label>
  183. </div>
  184. </header>-->
  185. <aside class="sidebar-drawer">
  186. <div class="sidebar-container">
  187. <div class="sidebar-sticky"><a class="farama-sidebar__title" href="../../../">
  188. <img class="farama-header__logo only-light" src="../../../_static/img/minigrid.svg" alt="Light Logo"/>
  189. <img class="farama-header__logo only-dark" src="../../../_static/img/minigrid-white.svg" alt="Dark Logo"/>
  190. <span class="farama-header__title">MiniGrid Documentation</span>
  191. </a><form class="sidebar-search-container" method="get" action="../../../search/" role="search">
  192. <input class="sidebar-search" placeholder="Search" name="q" aria-label="Search">
  193. <input type="hidden" name="check_keywords" value="yes">
  194. <input type="hidden" name="area" value="default">
  195. </form>
  196. <div id="searchbox"></div><div class="sidebar-scroll"><div class="sidebar-tree">
  197. <p class="caption" role="heading"><span class="caption-text">Introduction</span></p>
  198. <ul>
  199. <li class="toctree-l1"><a class="reference internal" href="../../../content/basic_usage/">Basic Usage</a></li>
  200. <li class="toctree-l1"><a class="reference internal" href="../../../content/basic_usage/#installation">Installation</a></li>
  201. <li class="toctree-l1"><a class="reference internal" href="../../../content/publications/">List of Publications</a></li>
  202. <li class="toctree-l1"><a class="reference internal" href="../../../content/create_env_tutorial/">Tutorial on Creating Environments</a></li>
  203. <li class="toctree-l1"><a class="reference internal" href="../../../content/training/">Training Minigrid Environments</a></li>
  204. </ul>
  205. <p class="caption" role="heading"><span class="caption-text">Wrappers</span></p>
  206. <ul>
  207. <li class="toctree-l1 has-children"><a class="reference internal" href="../../../api/wrapper/">Wrapper</a><input class="toctree-checkbox" id="toctree-checkbox-1" name="toctree-checkbox-1" role="switch" type="checkbox"/><label for="toctree-checkbox-1"><div class="visually-hidden">Toggle navigation of Wrapper</div><i class="icon"><svg><use href="#svg-arrow-right"></use></svg></i></label><ul>
  208. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/">Action Bonus</a></li>
  209. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#dict-observation-space">Dict Observation Space</a></li>
  210. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#direction-obs">Direction Obs</a></li>
  211. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#flatobs">FlatObs</a></li>
  212. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#fully-obs">Fully Obs</a></li>
  213. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#image-observation">Image Observation</a></li>
  214. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#no-death">No Death</a></li>
  215. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#observation">Observation</a></li>
  216. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#one-hot-partial-obs">One Hot Partial Obs</a></li>
  217. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#reseed">Reseed</a></li>
  218. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#rgb-img-obs">RGB Img Obs</a></li>
  219. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#rgb-partial-img-obs">RGB Partial Img Obs</a></li>
  220. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#position-bonus">Position Bonus</a></li>
  221. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#stochastic-action">Stochastic Action</a></li>
  222. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#symbolic-obs">Symbolic Obs</a></li>
  223. <li class="toctree-l2"><a class="reference internal" href="../../../api/wrappers/#view-size">View Size</a></li>
  224. </ul>
  225. </li>
  226. </ul>
  227. <p class="caption" role="heading"><span class="caption-text">Environments</span></p>
  228. <ul>
  229. <li class="toctree-l1 has-children"><a class="reference internal" href="../../../environments/minigrid/">Minigrid Environments</a><input class="toctree-checkbox" id="toctree-checkbox-2" name="toctree-checkbox-2" role="switch" type="checkbox"/><label for="toctree-checkbox-2"><div class="visually-hidden">Toggle navigation of Minigrid Environments</div><i class="icon"><svg><use href="#svg-arrow-right"></use></svg></i></label><ul>
  230. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/BlockedUnlockPickupEnv/">Blocked Unlock Pickup</a></li>
  231. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/CrossingEnv/">Crossing</a></li>
  232. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/DistShiftEnv/">Dist Shift</a></li>
  233. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/DoorKeyEnv/">Door Key</a></li>
  234. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/DynamicObstaclesEnv/">Dynamic Obstacles</a></li>
  235. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/EmptyEnv/">Empty</a></li>
  236. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/FetchEnv/">Fetch</a></li>
  237. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/FourRoomsEnv/">Four Rooms</a></li>
  238. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/GoToDoorEnv/">Go To Door</a></li>
  239. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/GoToObjectEnv/">Go To Object</a></li>
  240. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/KeyCorridorEnv/">Key Corridor</a></li>
  241. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/LavaGapEnv/">Lava Gap</a></li>
  242. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/LockedRoomEnv/">Locked Room</a></li>
  243. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/MemoryEnv/">Memory</a></li>
  244. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/MultiRoomEnv/">Multi Room</a></li>
  245. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/ObstructedMaze_1Dlhb/">Obstructed Maze Dlhb</a></li>
  246. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/ObstructedMaze_Full/">Obstructed Maze Full</a></li>
  247. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/PlaygroundEnv/">Playground</a></li>
  248. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/PutNearEnv/">Put Near</a></li>
  249. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/RedBlueDoorEnv/">Red Blue Door</a></li>
  250. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/UnlockEnv/">Unlock</a></li>
  251. <li class="toctree-l2"><a class="reference internal" href="../../../environments/minigrid/UnlockPickupEnv/">Unlock Pickup</a></li>
  252. </ul>
  253. </li>
  254. <li class="toctree-l1 has-children"><a class="reference internal" href="../../../environments/babyai/">BabyAI Environments</a><input class="toctree-checkbox" id="toctree-checkbox-3" name="toctree-checkbox-3" role="switch" type="checkbox"/><label for="toctree-checkbox-3"><div class="visually-hidden">Toggle navigation of BabyAI Environments</div><i class="icon"><svg><use href="#svg-arrow-right"></use></svg></i></label><ul>
  255. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/GoToRedBallGrey/">Go To Red Ball Grey</a></li>
  256. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/GoToRedBall/">Go To Red Ball</a></li>
  257. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/GoToRedBallNoDists/">Go To Red Ball No Dists</a></li>
  258. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/GoToObj/">Go To Obj</a></li>
  259. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/GoToLocal/">Go To Local</a></li>
  260. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/GoTo/">Go To</a></li>
  261. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/GoToImpUnlock/">Go To Imp Unlock</a></li>
  262. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/GoToSeq/">Go To Seq</a></li>
  263. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/GoToRedBlueBall/">Go To Red Blue Ball</a></li>
  264. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/GoToDoor/">Go To Door</a></li>
  265. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/GoToObjDoor/">Go To Obj Door</a></li>
  266. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/Open/">Open</a></li>
  267. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/OpenRedDoor/">Open Red Door</a></li>
  268. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/OpenDoor/">Open Door</a></li>
  269. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/OpenTwoDoors/">Open Two Doors</a></li>
  270. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/OpenDoorsOrder/">Open Doors Order</a></li>
  271. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/Pickup/">Pickup</a></li>
  272. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/UnblockPickup/">Unblock Pickup</a></li>
  273. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/PickupLoc/">Pickup Loc</a></li>
  274. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/PickupDist/">Pickup Dist</a></li>
  275. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/PickupAbove/">Pickup Above</a></li>
  276. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/PutNextLocal/">Put Next Local</a></li>
  277. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/PutNext/">Put Next</a></li>
  278. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/Unlock/">Unlock</a></li>
  279. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/UnlockLocal/">Unlock Local</a></li>
  280. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/KeyInBox/">Key In Box</a></li>
  281. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/UnlockPickup/">Unlock Pickup</a></li>
  282. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/BlockedUnlockPickup/">Blocked Unlock Pickup</a></li>
  283. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/UnlockToUnlock/">Unlock To Unlock</a></li>
  284. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/ActionObjDoor/">Action Obj Door</a></li>
  285. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/FindObjS5/">Find Obj</a></li>
  286. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/KeyCorridor/">Key Corridor</a></li>
  287. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/OneRoomS8/">One Room</a></li>
  288. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/MoveTwoAcross/">Move Two Across</a></li>
  289. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/Synth/">Synth</a></li>
  290. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/SynthLoc/">Synth Loc</a></li>
  291. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/SynthSeq/">Synth Seq</a></li>
  292. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/MiniBossLevel/">Mini Boss Level</a></li>
  293. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/BossLevel/">Boss Level</a></li>
  294. <li class="toctree-l2"><a class="reference internal" href="../../../environments/babyai/BossLevelNoUnlock/">Boss Level No Unlock</a></li>
  295. </ul>
  296. </li>
  297. </ul>
  298. <p class="caption" role="heading"><span class="caption-text">Development</span></p>
  299. <ul>
  300. <li class="toctree-l1"><a class="reference internal" href="../../../release_notes/">Release Notes</a></li>
  301. <li class="toctree-l1"><a class="reference external" href="https://github.com/Farama-Foundation/MiniGrid">Github</a></li>
  302. </ul>
  303. </div>
  304. </div>
  305. </div>
  306. </div>
  307. </aside>
  308. <div class="main-container">
  309. <div class="main">
  310. <div class="content">
  311. <div class="article-container">
  312. <a href="#" class="back-to-top muted-link">
  313. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24">
  314. <path d="M13 20h-2V8l-5.5 5.5-1.42-1.42L12 4.16l7.92 7.92-1.42 1.42L13 8v12z"></path>
  315. </svg>
  316. <span>Back to top</span>
  317. </a>
  318. <div class="content-icon-container"><div class="theme-toggle-container theme-toggle-content">
  319. <button class="theme-toggle" title="Toggle color theme">
  320. <div class="visually-hidden">Toggle Light / Dark / Auto color theme</div>
  321. <svg class="theme-icon-when-auto">
  322. <use href="#svg-sun-half"></use>
  323. </svg>
  324. <svg class="theme-icon-when-dark">
  325. <use href="#svg-moon"></use>
  326. </svg>
  327. <svg class="theme-icon-when-light">
  328. <use href="#svg-sun"></use>
  329. </svg>
  330. </button>
  331. </div>
  332. <label class="toc-overlay-icon toc-content-icon no-toc" for="__toc">
  333. <div class="visually-hidden">Toggle table of contents sidebar</div>
  334. <i class="icon"><svg>
  335. <use href="#svg-toc"></use>
  336. </svg></i>
  337. </label>
  338. </div>
  339. <article role="main">
  340. <h1>Source code for minigrid.wrappers</h1><div class="highlight"><pre>
  341. <span></span><span class="kn">from</span> <span class="nn">__future__</span> <span class="kn">import</span> <span class="n">annotations</span>
  342. <span class="kn">import</span> <span class="nn">math</span>
  343. <span class="kn">import</span> <span class="nn">operator</span>
  344. <span class="kn">from</span> <span class="nn">functools</span> <span class="kn">import</span> <span class="n">reduce</span>
  345. <span class="kn">from</span> <span class="nn">typing</span> <span class="kn">import</span> <span class="n">Any</span>
  346. <span class="kn">import</span> <span class="nn">gymnasium</span> <span class="k">as</span> <span class="nn">gym</span>
  347. <span class="kn">import</span> <span class="nn">numpy</span> <span class="k">as</span> <span class="nn">np</span>
  348. <span class="kn">from</span> <span class="nn">gymnasium</span> <span class="kn">import</span> <span class="n">logger</span><span class="p">,</span> <span class="n">spaces</span>
  349. <span class="kn">from</span> <span class="nn">gymnasium.core</span> <span class="kn">import</span> <span class="n">ActionWrapper</span><span class="p">,</span> <span class="n">ObservationWrapper</span><span class="p">,</span> <span class="n">ObsType</span><span class="p">,</span> <span class="n">Wrapper</span>
  350. <span class="kn">from</span> <span class="nn">minigrid.core.constants</span> <span class="kn">import</span> <span class="n">COLOR_TO_IDX</span><span class="p">,</span> <span class="n">OBJECT_TO_IDX</span><span class="p">,</span> <span class="n">STATE_TO_IDX</span>
  351. <span class="kn">from</span> <span class="nn">minigrid.core.world_object</span> <span class="kn">import</span> <span class="n">Goal</span>
  352. <div class="viewcode-block" id="ReseedWrapper">
  353. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.ReseedWrapper">[docs]</a>
  354. <span class="k">class</span> <span class="nc">ReseedWrapper</span><span class="p">(</span><span class="n">Wrapper</span><span class="p">):</span>
  355. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  356. <span class="sd"> Wrapper to always regenerate an environment with the same set of seeds.</span>
  357. <span class="sd"> This can be used to force an environment to always keep the same</span>
  358. <span class="sd"> configuration when reset.</span>
  359. <span class="sd"> Example:</span>
  360. <span class="sd"> &gt;&gt;&gt; import minigrid</span>
  361. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  362. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import ReseedWrapper</span>
  363. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-Empty-5x5-v0&quot;)</span>
  364. <span class="sd"> &gt;&gt;&gt; _ = env.reset(seed=123)</span>
  365. <span class="sd"> &gt;&gt;&gt; [env.np_random.integers(10) for i in range(10)]</span>
  366. <span class="sd"> [0, 6, 5, 0, 9, 2, 2, 1, 3, 1]</span>
  367. <span class="sd"> &gt;&gt;&gt; env = ReseedWrapper(env, seeds=[0, 1], seed_idx=0)</span>
  368. <span class="sd"> &gt;&gt;&gt; _, _ = env.reset()</span>
  369. <span class="sd"> &gt;&gt;&gt; [env.np_random.integers(10) for i in range(10)]</span>
  370. <span class="sd"> [8, 6, 5, 2, 3, 0, 0, 0, 1, 8]</span>
  371. <span class="sd"> &gt;&gt;&gt; _, _ = env.reset()</span>
  372. <span class="sd"> &gt;&gt;&gt; [env.np_random.integers(10) for i in range(10)]</span>
  373. <span class="sd"> [4, 5, 7, 9, 0, 1, 8, 9, 2, 3]</span>
  374. <span class="sd"> &gt;&gt;&gt; _, _ = env.reset()</span>
  375. <span class="sd"> &gt;&gt;&gt; [env.np_random.integers(10) for i in range(10)]</span>
  376. <span class="sd"> [8, 6, 5, 2, 3, 0, 0, 0, 1, 8]</span>
  377. <span class="sd"> &gt;&gt;&gt; _, _ = env.reset()</span>
  378. <span class="sd"> &gt;&gt;&gt; [env.np_random.integers(10) for i in range(10)]</span>
  379. <span class="sd"> [4, 5, 7, 9, 0, 1, 8, 9, 2, 3]</span>
  380. <span class="sd"> &quot;&quot;&quot;</span>
  381. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">,</span> <span class="n">seeds</span><span class="o">=</span><span class="p">(</span><span class="mi">0</span><span class="p">,),</span> <span class="n">seed_idx</span><span class="o">=</span><span class="mi">0</span><span class="p">):</span>
  382. <span class="w"> </span><span class="sd">&quot;&quot;&quot;A wrapper that always regenerate an environment with the same set of seeds.</span>
  383. <span class="sd"> Args:</span>
  384. <span class="sd"> env: The environment to apply the wrapper</span>
  385. <span class="sd"> seeds: A list of seed to be applied to the env</span>
  386. <span class="sd"> seed_idx: Index of the initial seed in seeds</span>
  387. <span class="sd"> &quot;&quot;&quot;</span>
  388. <span class="bp">self</span><span class="o">.</span><span class="n">seeds</span> <span class="o">=</span> <span class="nb">list</span><span class="p">(</span><span class="n">seeds</span><span class="p">)</span>
  389. <span class="bp">self</span><span class="o">.</span><span class="n">seed_idx</span> <span class="o">=</span> <span class="n">seed_idx</span>
  390. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  391. <span class="k">def</span> <span class="nf">reset</span><span class="p">(</span>
  392. <span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">seed</span><span class="p">:</span> <span class="nb">int</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">,</span> <span class="n">options</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">]</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span>
  393. <span class="p">)</span> <span class="o">-&gt;</span> <span class="nb">tuple</span><span class="p">[</span><span class="n">ObsType</span><span class="p">,</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">]]:</span>
  394. <span class="k">if</span> <span class="n">seed</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
  395. <span class="n">logger</span><span class="o">.</span><span class="n">warn</span><span class="p">(</span>
  396. <span class="s2">&quot;A seed has been passed to `ReseedWrapper.reset` which is ignored.&quot;</span>
  397. <span class="p">)</span>
  398. <span class="n">seed</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">seeds</span><span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">seed_idx</span><span class="p">]</span>
  399. <span class="bp">self</span><span class="o">.</span><span class="n">seed_idx</span> <span class="o">=</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">seed_idx</span> <span class="o">+</span> <span class="mi">1</span><span class="p">)</span> <span class="o">%</span> <span class="nb">len</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">seeds</span><span class="p">)</span>
  400. <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">env</span><span class="o">.</span><span class="n">reset</span><span class="p">(</span><span class="n">seed</span><span class="o">=</span><span class="n">seed</span><span class="p">,</span> <span class="n">options</span><span class="o">=</span><span class="n">options</span><span class="p">)</span></div>
  401. <div class="viewcode-block" id="ActionBonus">
  402. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.ActionBonus">[docs]</a>
  403. <span class="k">class</span> <span class="nc">ActionBonus</span><span class="p">(</span><span class="n">gym</span><span class="o">.</span><span class="n">Wrapper</span><span class="p">):</span>
  404. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  405. <span class="sd"> Wrapper which adds an exploration bonus.</span>
  406. <span class="sd"> This is a reward to encourage exploration of less</span>
  407. <span class="sd"> visited (state,action) pairs.</span>
  408. <span class="sd"> Example:</span>
  409. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  410. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import ActionBonus</span>
  411. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-Empty-5x5-v0&quot;)</span>
  412. <span class="sd"> &gt;&gt;&gt; _, _ = env.reset(seed=0)</span>
  413. <span class="sd"> &gt;&gt;&gt; _, reward, _, _, _ = env.step(1)</span>
  414. <span class="sd"> &gt;&gt;&gt; print(reward)</span>
  415. <span class="sd"> 0</span>
  416. <span class="sd"> &gt;&gt;&gt; _, reward, _, _, _ = env.step(1)</span>
  417. <span class="sd"> &gt;&gt;&gt; print(reward)</span>
  418. <span class="sd"> 0</span>
  419. <span class="sd"> &gt;&gt;&gt; env_bonus = ActionBonus(env)</span>
  420. <span class="sd"> &gt;&gt;&gt; _, _ = env_bonus.reset(seed=0)</span>
  421. <span class="sd"> &gt;&gt;&gt; _, reward, _, _, _ = env_bonus.step(1)</span>
  422. <span class="sd"> &gt;&gt;&gt; print(reward)</span>
  423. <span class="sd"> 1.0</span>
  424. <span class="sd"> &gt;&gt;&gt; _, reward, _, _, _ = env_bonus.step(1)</span>
  425. <span class="sd"> &gt;&gt;&gt; print(reward)</span>
  426. <span class="sd"> 1.0</span>
  427. <span class="sd"> &quot;&quot;&quot;</span>
  428. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">):</span>
  429. <span class="w"> </span><span class="sd">&quot;&quot;&quot;A wrapper that adds an exploration bonus to less visited (state,action) pairs.</span>
  430. <span class="sd"> Args:</span>
  431. <span class="sd"> env: The environment to apply the wrapper</span>
  432. <span class="sd"> &quot;&quot;&quot;</span>
  433. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  434. <span class="bp">self</span><span class="o">.</span><span class="n">counts</span> <span class="o">=</span> <span class="p">{}</span>
  435. <span class="k">def</span> <span class="nf">step</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">action</span><span class="p">):</span>
  436. <span class="w"> </span><span class="sd">&quot;&quot;&quot;Steps through the environment with `action`.&quot;&quot;&quot;</span>
  437. <span class="n">obs</span><span class="p">,</span> <span class="n">reward</span><span class="p">,</span> <span class="n">terminated</span><span class="p">,</span> <span class="n">truncated</span><span class="p">,</span> <span class="n">info</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">env</span><span class="o">.</span><span class="n">step</span><span class="p">(</span><span class="n">action</span><span class="p">)</span>
  438. <span class="n">env</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">unwrapped</span>
  439. <span class="n">tup</span> <span class="o">=</span> <span class="p">(</span><span class="nb">tuple</span><span class="p">(</span><span class="n">env</span><span class="o">.</span><span class="n">agent_pos</span><span class="p">),</span> <span class="n">env</span><span class="o">.</span><span class="n">agent_dir</span><span class="p">,</span> <span class="n">action</span><span class="p">)</span>
  440. <span class="c1"># Get the count for this (s,a) pair</span>
  441. <span class="n">pre_count</span> <span class="o">=</span> <span class="mi">0</span>
  442. <span class="k">if</span> <span class="n">tup</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">counts</span><span class="p">:</span>
  443. <span class="n">pre_count</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">counts</span><span class="p">[</span><span class="n">tup</span><span class="p">]</span>
  444. <span class="c1"># Update the count for this (s,a) pair</span>
  445. <span class="n">new_count</span> <span class="o">=</span> <span class="n">pre_count</span> <span class="o">+</span> <span class="mi">1</span>
  446. <span class="bp">self</span><span class="o">.</span><span class="n">counts</span><span class="p">[</span><span class="n">tup</span><span class="p">]</span> <span class="o">=</span> <span class="n">new_count</span>
  447. <span class="n">bonus</span> <span class="o">=</span> <span class="mi">1</span> <span class="o">/</span> <span class="n">math</span><span class="o">.</span><span class="n">sqrt</span><span class="p">(</span><span class="n">new_count</span><span class="p">)</span>
  448. <span class="n">reward</span> <span class="o">+=</span> <span class="n">bonus</span>
  449. <span class="k">return</span> <span class="n">obs</span><span class="p">,</span> <span class="n">reward</span><span class="p">,</span> <span class="n">terminated</span><span class="p">,</span> <span class="n">truncated</span><span class="p">,</span> <span class="n">info</span></div>
  450. <div class="viewcode-block" id="PositionBonus">
  451. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.PositionBonus">[docs]</a>
  452. <span class="k">class</span> <span class="nc">PositionBonus</span><span class="p">(</span><span class="n">Wrapper</span><span class="p">):</span>
  453. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  454. <span class="sd"> Adds an exploration bonus based on which positions</span>
  455. <span class="sd"> are visited on the grid.</span>
  456. <span class="sd"> Note:</span>
  457. <span class="sd"> This wrapper was previously called ``StateBonus``.</span>
  458. <span class="sd"> Example:</span>
  459. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  460. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import PositionBonus</span>
  461. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-Empty-5x5-v0&quot;)</span>
  462. <span class="sd"> &gt;&gt;&gt; _, _ = env.reset(seed=0)</span>
  463. <span class="sd"> &gt;&gt;&gt; _, reward, _, _, _ = env.step(1)</span>
  464. <span class="sd"> &gt;&gt;&gt; print(reward)</span>
  465. <span class="sd"> 0</span>
  466. <span class="sd"> &gt;&gt;&gt; _, reward, _, _, _ = env.step(1)</span>
  467. <span class="sd"> &gt;&gt;&gt; print(reward)</span>
  468. <span class="sd"> 0</span>
  469. <span class="sd"> &gt;&gt;&gt; env_bonus = PositionBonus(env)</span>
  470. <span class="sd"> &gt;&gt;&gt; obs, _ = env_bonus.reset(seed=0)</span>
  471. <span class="sd"> &gt;&gt;&gt; obs, reward, terminated, truncated, info = env_bonus.step(1)</span>
  472. <span class="sd"> &gt;&gt;&gt; print(reward)</span>
  473. <span class="sd"> 1.0</span>
  474. <span class="sd"> &gt;&gt;&gt; obs, reward, terminated, truncated, info = env_bonus.step(1)</span>
  475. <span class="sd"> &gt;&gt;&gt; print(reward)</span>
  476. <span class="sd"> 0.7071067811865475</span>
  477. <span class="sd"> &quot;&quot;&quot;</span>
  478. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">):</span>
  479. <span class="w"> </span><span class="sd">&quot;&quot;&quot;A wrapper that adds an exploration bonus to less visited positions.</span>
  480. <span class="sd"> Args:</span>
  481. <span class="sd"> env: The environment to apply the wrapper</span>
  482. <span class="sd"> &quot;&quot;&quot;</span>
  483. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  484. <span class="bp">self</span><span class="o">.</span><span class="n">counts</span> <span class="o">=</span> <span class="p">{}</span>
  485. <span class="k">def</span> <span class="nf">step</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">action</span><span class="p">):</span>
  486. <span class="w"> </span><span class="sd">&quot;&quot;&quot;Steps through the environment with `action`.&quot;&quot;&quot;</span>
  487. <span class="n">obs</span><span class="p">,</span> <span class="n">reward</span><span class="p">,</span> <span class="n">terminated</span><span class="p">,</span> <span class="n">truncated</span><span class="p">,</span> <span class="n">info</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">env</span><span class="o">.</span><span class="n">step</span><span class="p">(</span><span class="n">action</span><span class="p">)</span>
  488. <span class="c1"># Tuple based on which we index the counts</span>
  489. <span class="c1"># We use the position after an update</span>
  490. <span class="n">env</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">unwrapped</span>
  491. <span class="n">tup</span> <span class="o">=</span> <span class="nb">tuple</span><span class="p">(</span><span class="n">env</span><span class="o">.</span><span class="n">agent_pos</span><span class="p">)</span>
  492. <span class="c1"># Get the count for this key</span>
  493. <span class="n">pre_count</span> <span class="o">=</span> <span class="mi">0</span>
  494. <span class="k">if</span> <span class="n">tup</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">counts</span><span class="p">:</span>
  495. <span class="n">pre_count</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">counts</span><span class="p">[</span><span class="n">tup</span><span class="p">]</span>
  496. <span class="c1"># Update the count for this key</span>
  497. <span class="n">new_count</span> <span class="o">=</span> <span class="n">pre_count</span> <span class="o">+</span> <span class="mi">1</span>
  498. <span class="bp">self</span><span class="o">.</span><span class="n">counts</span><span class="p">[</span><span class="n">tup</span><span class="p">]</span> <span class="o">=</span> <span class="n">new_count</span>
  499. <span class="n">bonus</span> <span class="o">=</span> <span class="mi">1</span> <span class="o">/</span> <span class="n">math</span><span class="o">.</span><span class="n">sqrt</span><span class="p">(</span><span class="n">new_count</span><span class="p">)</span>
  500. <span class="n">reward</span> <span class="o">+=</span> <span class="n">bonus</span>
  501. <span class="k">return</span> <span class="n">obs</span><span class="p">,</span> <span class="n">reward</span><span class="p">,</span> <span class="n">terminated</span><span class="p">,</span> <span class="n">truncated</span><span class="p">,</span> <span class="n">info</span></div>
  502. <div class="viewcode-block" id="ImgObsWrapper">
  503. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.ImgObsWrapper">[docs]</a>
  504. <span class="k">class</span> <span class="nc">ImgObsWrapper</span><span class="p">(</span><span class="n">ObservationWrapper</span><span class="p">):</span>
  505. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  506. <span class="sd"> Use the image as the only observation output, no language/mission.</span>
  507. <span class="sd"> Example:</span>
  508. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  509. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import ImgObsWrapper</span>
  510. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-Empty-5x5-v0&quot;)</span>
  511. <span class="sd"> &gt;&gt;&gt; obs, _ = env.reset()</span>
  512. <span class="sd"> &gt;&gt;&gt; obs.keys()</span>
  513. <span class="sd"> dict_keys([&#39;image&#39;, &#39;direction&#39;, &#39;mission&#39;])</span>
  514. <span class="sd"> &gt;&gt;&gt; env = ImgObsWrapper(env)</span>
  515. <span class="sd"> &gt;&gt;&gt; obs, _ = env.reset()</span>
  516. <span class="sd"> &gt;&gt;&gt; obs.shape</span>
  517. <span class="sd"> (7, 7, 3)</span>
  518. <span class="sd"> &quot;&quot;&quot;</span>
  519. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">):</span>
  520. <span class="w"> </span><span class="sd">&quot;&quot;&quot;A wrapper that makes image the only observation.</span>
  521. <span class="sd"> Args:</span>
  522. <span class="sd"> env: The environment to apply the wrapper</span>
  523. <span class="sd"> &quot;&quot;&quot;</span>
  524. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  525. <span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">observation_space</span><span class="o">.</span><span class="n">spaces</span><span class="p">[</span><span class="s2">&quot;image&quot;</span><span class="p">]</span>
  526. <span class="k">def</span> <span class="nf">observation</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">obs</span><span class="p">):</span>
  527. <span class="k">return</span> <span class="n">obs</span><span class="p">[</span><span class="s2">&quot;image&quot;</span><span class="p">]</span></div>
  528. <div class="viewcode-block" id="OneHotPartialObsWrapper">
  529. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.OneHotPartialObsWrapper">[docs]</a>
  530. <span class="k">class</span> <span class="nc">OneHotPartialObsWrapper</span><span class="p">(</span><span class="n">ObservationWrapper</span><span class="p">):</span>
  531. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  532. <span class="sd"> Wrapper to get a one-hot encoding of a partially observable</span>
  533. <span class="sd"> agent view as observation.</span>
  534. <span class="sd"> Example:</span>
  535. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  536. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import OneHotPartialObsWrapper</span>
  537. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-Empty-5x5-v0&quot;)</span>
  538. <span class="sd"> &gt;&gt;&gt; obs, _ = env.reset()</span>
  539. <span class="sd"> &gt;&gt;&gt; obs[&quot;image&quot;][0, :, :]</span>
  540. <span class="sd"> array([[2, 5, 0],</span>
  541. <span class="sd"> [2, 5, 0],</span>
  542. <span class="sd"> [2, 5, 0],</span>
  543. <span class="sd"> [2, 5, 0],</span>
  544. <span class="sd"> [2, 5, 0],</span>
  545. <span class="sd"> [2, 5, 0],</span>
  546. <span class="sd"> [2, 5, 0]], dtype=uint8)</span>
  547. <span class="sd"> &gt;&gt;&gt; env = OneHotPartialObsWrapper(env)</span>
  548. <span class="sd"> &gt;&gt;&gt; obs, _ = env.reset()</span>
  549. <span class="sd"> &gt;&gt;&gt; obs[&quot;image&quot;][0, :, :]</span>
  550. <span class="sd"> array([[0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0],</span>
  551. <span class="sd"> [0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0],</span>
  552. <span class="sd"> [0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0],</span>
  553. <span class="sd"> [0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0],</span>
  554. <span class="sd"> [0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0],</span>
  555. <span class="sd"> [0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0],</span>
  556. <span class="sd"> [0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0]],</span>
  557. <span class="sd"> dtype=uint8)</span>
  558. <span class="sd"> &quot;&quot;&quot;</span>
  559. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">,</span> <span class="n">tile_size</span><span class="o">=</span><span class="mi">8</span><span class="p">):</span>
  560. <span class="w"> </span><span class="sd">&quot;&quot;&quot;A wrapper that makes the image observation a one-hot encoding of a partially observable agent view.</span>
  561. <span class="sd"> Args:</span>
  562. <span class="sd"> env: The environment to apply the wrapper</span>
  563. <span class="sd"> &quot;&quot;&quot;</span>
  564. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  565. <span class="bp">self</span><span class="o">.</span><span class="n">tile_size</span> <span class="o">=</span> <span class="n">tile_size</span>
  566. <span class="n">obs_shape</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">observation_space</span><span class="p">[</span><span class="s2">&quot;image&quot;</span><span class="p">]</span><span class="o">.</span><span class="n">shape</span>
  567. <span class="c1"># Number of bits per cell</span>
  568. <span class="n">num_bits</span> <span class="o">=</span> <span class="nb">len</span><span class="p">(</span><span class="n">OBJECT_TO_IDX</span><span class="p">)</span> <span class="o">+</span> <span class="nb">len</span><span class="p">(</span><span class="n">COLOR_TO_IDX</span><span class="p">)</span> <span class="o">+</span> <span class="nb">len</span><span class="p">(</span><span class="n">STATE_TO_IDX</span><span class="p">)</span>
  569. <span class="n">new_image_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Box</span><span class="p">(</span>
  570. <span class="n">low</span><span class="o">=</span><span class="mi">0</span><span class="p">,</span> <span class="n">high</span><span class="o">=</span><span class="mi">255</span><span class="p">,</span> <span class="n">shape</span><span class="o">=</span><span class="p">(</span><span class="n">obs_shape</span><span class="p">[</span><span class="mi">0</span><span class="p">],</span> <span class="n">obs_shape</span><span class="p">[</span><span class="mi">1</span><span class="p">],</span> <span class="n">num_bits</span><span class="p">),</span> <span class="n">dtype</span><span class="o">=</span><span class="s2">&quot;uint8&quot;</span>
  571. <span class="p">)</span>
  572. <span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Dict</span><span class="p">(</span>
  573. <span class="p">{</span><span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span><span class="o">.</span><span class="n">spaces</span><span class="p">,</span> <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">new_image_space</span><span class="p">}</span>
  574. <span class="p">)</span>
  575. <span class="k">def</span> <span class="nf">observation</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">obs</span><span class="p">):</span>
  576. <span class="n">img</span> <span class="o">=</span> <span class="n">obs</span><span class="p">[</span><span class="s2">&quot;image&quot;</span><span class="p">]</span>
  577. <span class="n">out</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">zeros</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span><span class="o">.</span><span class="n">spaces</span><span class="p">[</span><span class="s2">&quot;image&quot;</span><span class="p">]</span><span class="o">.</span><span class="n">shape</span><span class="p">,</span> <span class="n">dtype</span><span class="o">=</span><span class="s2">&quot;uint8&quot;</span><span class="p">)</span>
  578. <span class="k">for</span> <span class="n">i</span> <span class="ow">in</span> <span class="nb">range</span><span class="p">(</span><span class="n">img</span><span class="o">.</span><span class="n">shape</span><span class="p">[</span><span class="mi">0</span><span class="p">]):</span>
  579. <span class="k">for</span> <span class="n">j</span> <span class="ow">in</span> <span class="nb">range</span><span class="p">(</span><span class="n">img</span><span class="o">.</span><span class="n">shape</span><span class="p">[</span><span class="mi">1</span><span class="p">]):</span>
  580. <span class="nb">type</span> <span class="o">=</span> <span class="n">img</span><span class="p">[</span><span class="n">i</span><span class="p">,</span> <span class="n">j</span><span class="p">,</span> <span class="mi">0</span><span class="p">]</span>
  581. <span class="n">color</span> <span class="o">=</span> <span class="n">img</span><span class="p">[</span><span class="n">i</span><span class="p">,</span> <span class="n">j</span><span class="p">,</span> <span class="mi">1</span><span class="p">]</span>
  582. <span class="n">state</span> <span class="o">=</span> <span class="n">img</span><span class="p">[</span><span class="n">i</span><span class="p">,</span> <span class="n">j</span><span class="p">,</span> <span class="mi">2</span><span class="p">]</span>
  583. <span class="n">out</span><span class="p">[</span><span class="n">i</span><span class="p">,</span> <span class="n">j</span><span class="p">,</span> <span class="nb">type</span><span class="p">]</span> <span class="o">=</span> <span class="mi">1</span>
  584. <span class="n">out</span><span class="p">[</span><span class="n">i</span><span class="p">,</span> <span class="n">j</span><span class="p">,</span> <span class="nb">len</span><span class="p">(</span><span class="n">OBJECT_TO_IDX</span><span class="p">)</span> <span class="o">+</span> <span class="n">color</span><span class="p">]</span> <span class="o">=</span> <span class="mi">1</span>
  585. <span class="n">out</span><span class="p">[</span><span class="n">i</span><span class="p">,</span> <span class="n">j</span><span class="p">,</span> <span class="nb">len</span><span class="p">(</span><span class="n">OBJECT_TO_IDX</span><span class="p">)</span> <span class="o">+</span> <span class="nb">len</span><span class="p">(</span><span class="n">COLOR_TO_IDX</span><span class="p">)</span> <span class="o">+</span> <span class="n">state</span><span class="p">]</span> <span class="o">=</span> <span class="mi">1</span>
  586. <span class="k">return</span> <span class="p">{</span><span class="o">**</span><span class="n">obs</span><span class="p">,</span> <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">out</span><span class="p">}</span></div>
  587. <div class="viewcode-block" id="RGBImgObsWrapper">
  588. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.RGBImgObsWrapper">[docs]</a>
  589. <span class="k">class</span> <span class="nc">RGBImgObsWrapper</span><span class="p">(</span><span class="n">ObservationWrapper</span><span class="p">):</span>
  590. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  591. <span class="sd"> Wrapper to use fully observable RGB image as observation,</span>
  592. <span class="sd"> This can be used to have the agent to solve the gridworld in pixel space.</span>
  593. <span class="sd"> Example:</span>
  594. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  595. <span class="sd"> &gt;&gt;&gt; import matplotlib.pyplot as plt</span>
  596. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import RGBImgObsWrapper</span>
  597. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-Empty-5x5-v0&quot;)</span>
  598. <span class="sd"> &gt;&gt;&gt; obs, _ = env.reset()</span>
  599. <span class="sd"> &gt;&gt;&gt; plt.imshow(obs[&#39;image&#39;]) # doctest: +SKIP</span>
  600. <span class="sd"> ![NoWrapper](../figures/lavacrossing_NoWrapper.png)</span>
  601. <span class="sd"> &gt;&gt;&gt; env = RGBImgObsWrapper(env)</span>
  602. <span class="sd"> &gt;&gt;&gt; obs, _ = env.reset()</span>
  603. <span class="sd"> &gt;&gt;&gt; plt.imshow(obs[&#39;image&#39;]) # doctest: +SKIP</span>
  604. <span class="sd"> ![RGBImgObsWrapper](../figures/lavacrossing_RGBImgObsWrapper.png)</span>
  605. <span class="sd"> &quot;&quot;&quot;</span>
  606. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">,</span> <span class="n">tile_size</span><span class="o">=</span><span class="mi">8</span><span class="p">):</span>
  607. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  608. <span class="bp">self</span><span class="o">.</span><span class="n">tile_size</span> <span class="o">=</span> <span class="n">tile_size</span>
  609. <span class="n">new_image_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Box</span><span class="p">(</span>
  610. <span class="n">low</span><span class="o">=</span><span class="mi">0</span><span class="p">,</span>
  611. <span class="n">high</span><span class="o">=</span><span class="mi">255</span><span class="p">,</span>
  612. <span class="n">shape</span><span class="o">=</span><span class="p">(</span>
  613. <span class="bp">self</span><span class="o">.</span><span class="n">unwrapped</span><span class="o">.</span><span class="n">width</span> <span class="o">*</span> <span class="n">tile_size</span><span class="p">,</span>
  614. <span class="bp">self</span><span class="o">.</span><span class="n">unwrapped</span><span class="o">.</span><span class="n">height</span> <span class="o">*</span> <span class="n">tile_size</span><span class="p">,</span>
  615. <span class="mi">3</span><span class="p">,</span>
  616. <span class="p">),</span>
  617. <span class="n">dtype</span><span class="o">=</span><span class="s2">&quot;uint8&quot;</span><span class="p">,</span>
  618. <span class="p">)</span>
  619. <span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Dict</span><span class="p">(</span>
  620. <span class="p">{</span><span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span><span class="o">.</span><span class="n">spaces</span><span class="p">,</span> <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">new_image_space</span><span class="p">}</span>
  621. <span class="p">)</span>
  622. <span class="k">def</span> <span class="nf">observation</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">obs</span><span class="p">):</span>
  623. <span class="n">rgb_img</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">get_frame</span><span class="p">(</span>
  624. <span class="n">highlight</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">unwrapped</span><span class="o">.</span><span class="n">highlight</span><span class="p">,</span> <span class="n">tile_size</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">tile_size</span>
  625. <span class="p">)</span>
  626. <span class="k">return</span> <span class="p">{</span><span class="o">**</span><span class="n">obs</span><span class="p">,</span> <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">rgb_img</span><span class="p">}</span></div>
  627. <div class="viewcode-block" id="RGBImgPartialObsWrapper">
  628. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.RGBImgPartialObsWrapper">[docs]</a>
  629. <span class="k">class</span> <span class="nc">RGBImgPartialObsWrapper</span><span class="p">(</span><span class="n">ObservationWrapper</span><span class="p">):</span>
  630. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  631. <span class="sd"> Wrapper to use partially observable RGB image as observation.</span>
  632. <span class="sd"> This can be used to have the agent to solve the gridworld in pixel space.</span>
  633. <span class="sd"> Example:</span>
  634. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  635. <span class="sd"> &gt;&gt;&gt; import matplotlib.pyplot as plt</span>
  636. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import RGBImgObsWrapper, RGBImgPartialObsWrapper</span>
  637. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-LavaCrossingS11N5-v0&quot;)</span>
  638. <span class="sd"> &gt;&gt;&gt; obs, _ = env.reset()</span>
  639. <span class="sd"> &gt;&gt;&gt; plt.imshow(obs[&quot;image&quot;]) # doctest: +SKIP</span>
  640. <span class="sd"> ![NoWrapper](../figures/lavacrossing_NoWrapper.png)</span>
  641. <span class="sd"> &gt;&gt;&gt; env_obs = RGBImgObsWrapper(env)</span>
  642. <span class="sd"> &gt;&gt;&gt; obs, _ = env_obs.reset()</span>
  643. <span class="sd"> &gt;&gt;&gt; plt.imshow(obs[&quot;image&quot;]) # doctest: +SKIP</span>
  644. <span class="sd"> ![RGBImgObsWrapper](../figures/lavacrossing_RGBImgObsWrapper.png)</span>
  645. <span class="sd"> &gt;&gt;&gt; env_obs = RGBImgPartialObsWrapper(env)</span>
  646. <span class="sd"> &gt;&gt;&gt; obs, _ = env_obs.reset()</span>
  647. <span class="sd"> &gt;&gt;&gt; plt.imshow(obs[&quot;image&quot;]) # doctest: +SKIP</span>
  648. <span class="sd"> ![RGBImgPartialObsWrapper](../figures/lavacrossing_RGBImgPartialObsWrapper.png)</span>
  649. <span class="sd"> &quot;&quot;&quot;</span>
  650. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">,</span> <span class="n">tile_size</span><span class="o">=</span><span class="mi">8</span><span class="p">):</span>
  651. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  652. <span class="c1"># Rendering attributes for observations</span>
  653. <span class="bp">self</span><span class="o">.</span><span class="n">tile_size</span> <span class="o">=</span> <span class="n">tile_size</span>
  654. <span class="n">obs_shape</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">observation_space</span><span class="o">.</span><span class="n">spaces</span><span class="p">[</span><span class="s2">&quot;image&quot;</span><span class="p">]</span><span class="o">.</span><span class="n">shape</span>
  655. <span class="n">new_image_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Box</span><span class="p">(</span>
  656. <span class="n">low</span><span class="o">=</span><span class="mi">0</span><span class="p">,</span>
  657. <span class="n">high</span><span class="o">=</span><span class="mi">255</span><span class="p">,</span>
  658. <span class="n">shape</span><span class="o">=</span><span class="p">(</span><span class="n">obs_shape</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">*</span> <span class="n">tile_size</span><span class="p">,</span> <span class="n">obs_shape</span><span class="p">[</span><span class="mi">1</span><span class="p">]</span> <span class="o">*</span> <span class="n">tile_size</span><span class="p">,</span> <span class="mi">3</span><span class="p">),</span>
  659. <span class="n">dtype</span><span class="o">=</span><span class="s2">&quot;uint8&quot;</span><span class="p">,</span>
  660. <span class="p">)</span>
  661. <span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Dict</span><span class="p">(</span>
  662. <span class="p">{</span><span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span><span class="o">.</span><span class="n">spaces</span><span class="p">,</span> <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">new_image_space</span><span class="p">}</span>
  663. <span class="p">)</span>
  664. <span class="k">def</span> <span class="nf">observation</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">obs</span><span class="p">):</span>
  665. <span class="n">rgb_img_partial</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">get_frame</span><span class="p">(</span><span class="n">tile_size</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">tile_size</span><span class="p">,</span> <span class="n">agent_pov</span><span class="o">=</span><span class="kc">True</span><span class="p">)</span>
  666. <span class="k">return</span> <span class="p">{</span><span class="o">**</span><span class="n">obs</span><span class="p">,</span> <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">rgb_img_partial</span><span class="p">}</span></div>
  667. <div class="viewcode-block" id="FullyObsWrapper">
  668. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.FullyObsWrapper">[docs]</a>
  669. <span class="k">class</span> <span class="nc">FullyObsWrapper</span><span class="p">(</span><span class="n">ObservationWrapper</span><span class="p">):</span>
  670. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  671. <span class="sd"> Fully observable gridworld using a compact grid encoding instead of the agent view.</span>
  672. <span class="sd"> Example:</span>
  673. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  674. <span class="sd"> &gt;&gt;&gt; import matplotlib.pyplot as plt</span>
  675. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import FullyObsWrapper</span>
  676. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-LavaCrossingS11N5-v0&quot;)</span>
  677. <span class="sd"> &gt;&gt;&gt; obs, _ = env.reset()</span>
  678. <span class="sd"> &gt;&gt;&gt; obs[&#39;image&#39;].shape</span>
  679. <span class="sd"> (7, 7, 3)</span>
  680. <span class="sd"> &gt;&gt;&gt; env_obs = FullyObsWrapper(env)</span>
  681. <span class="sd"> &gt;&gt;&gt; obs, _ = env_obs.reset()</span>
  682. <span class="sd"> &gt;&gt;&gt; obs[&#39;image&#39;].shape</span>
  683. <span class="sd"> (11, 11, 3)</span>
  684. <span class="sd"> &quot;&quot;&quot;</span>
  685. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">):</span>
  686. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  687. <span class="n">new_image_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Box</span><span class="p">(</span>
  688. <span class="n">low</span><span class="o">=</span><span class="mi">0</span><span class="p">,</span>
  689. <span class="n">high</span><span class="o">=</span><span class="mi">255</span><span class="p">,</span>
  690. <span class="n">shape</span><span class="o">=</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">env</span><span class="o">.</span><span class="n">width</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">env</span><span class="o">.</span><span class="n">height</span><span class="p">,</span> <span class="mi">3</span><span class="p">),</span> <span class="c1"># number of cells</span>
  691. <span class="n">dtype</span><span class="o">=</span><span class="s2">&quot;uint8&quot;</span><span class="p">,</span>
  692. <span class="p">)</span>
  693. <span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Dict</span><span class="p">(</span>
  694. <span class="p">{</span><span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span><span class="o">.</span><span class="n">spaces</span><span class="p">,</span> <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">new_image_space</span><span class="p">}</span>
  695. <span class="p">)</span>
  696. <span class="k">def</span> <span class="nf">observation</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">obs</span><span class="p">):</span>
  697. <span class="n">env</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">unwrapped</span>
  698. <span class="n">full_grid</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">grid</span><span class="o">.</span><span class="n">encode</span><span class="p">()</span>
  699. <span class="n">full_grid</span><span class="p">[</span><span class="n">env</span><span class="o">.</span><span class="n">agent_pos</span><span class="p">[</span><span class="mi">0</span><span class="p">]][</span><span class="n">env</span><span class="o">.</span><span class="n">agent_pos</span><span class="p">[</span><span class="mi">1</span><span class="p">]]</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">(</span>
  700. <span class="p">[</span><span class="n">OBJECT_TO_IDX</span><span class="p">[</span><span class="s2">&quot;agent&quot;</span><span class="p">],</span> <span class="n">COLOR_TO_IDX</span><span class="p">[</span><span class="s2">&quot;red&quot;</span><span class="p">],</span> <span class="n">env</span><span class="o">.</span><span class="n">agent_dir</span><span class="p">]</span>
  701. <span class="p">)</span>
  702. <span class="k">return</span> <span class="p">{</span><span class="o">**</span><span class="n">obs</span><span class="p">,</span> <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">full_grid</span><span class="p">}</span></div>
  703. <div class="viewcode-block" id="DictObservationSpaceWrapper">
  704. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.DictObservationSpaceWrapper">[docs]</a>
  705. <span class="k">class</span> <span class="nc">DictObservationSpaceWrapper</span><span class="p">(</span><span class="n">ObservationWrapper</span><span class="p">):</span>
  706. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  707. <span class="sd"> Transforms the observation space (that has a textual component) to a fully numerical observation space,</span>
  708. <span class="sd"> where the textual instructions are replaced by arrays representing the indices of each word in a fixed vocabulary.</span>
  709. <span class="sd"> This wrapper is not applicable to BabyAI environments, given that these have their own language component.</span>
  710. <span class="sd"> Example:</span>
  711. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  712. <span class="sd"> &gt;&gt;&gt; import matplotlib.pyplot as plt</span>
  713. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import DictObservationSpaceWrapper</span>
  714. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-LavaCrossingS11N5-v0&quot;)</span>
  715. <span class="sd"> &gt;&gt;&gt; obs, _ = env.reset()</span>
  716. <span class="sd"> &gt;&gt;&gt; obs[&#39;mission&#39;]</span>
  717. <span class="sd"> &#39;avoid the lava and get to the green goal square&#39;</span>
  718. <span class="sd"> &gt;&gt;&gt; env_obs = DictObservationSpaceWrapper(env)</span>
  719. <span class="sd"> &gt;&gt;&gt; obs, _ = env_obs.reset()</span>
  720. <span class="sd"> &gt;&gt;&gt; obs[&#39;mission&#39;][:10]</span>
  721. <span class="sd"> [19, 31, 17, 36, 20, 38, 31, 2, 15, 35]</span>
  722. <span class="sd"> &quot;&quot;&quot;</span>
  723. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">,</span> <span class="n">max_words_in_mission</span><span class="o">=</span><span class="mi">50</span><span class="p">,</span> <span class="n">word_dict</span><span class="o">=</span><span class="kc">None</span><span class="p">):</span>
  724. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  725. <span class="sd"> max_words_in_mission is the length of the array to represent a mission, value 0 for missing words</span>
  726. <span class="sd"> word_dict is a dictionary of words to use (keys=words, values=indices from 1 to &lt; max_words_in_mission),</span>
  727. <span class="sd"> if None, use the Minigrid language</span>
  728. <span class="sd"> &quot;&quot;&quot;</span>
  729. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  730. <span class="k">if</span> <span class="n">word_dict</span> <span class="ow">is</span> <span class="kc">None</span><span class="p">:</span>
  731. <span class="n">word_dict</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">get_minigrid_words</span><span class="p">()</span>
  732. <span class="bp">self</span><span class="o">.</span><span class="n">max_words_in_mission</span> <span class="o">=</span> <span class="n">max_words_in_mission</span>
  733. <span class="bp">self</span><span class="o">.</span><span class="n">word_dict</span> <span class="o">=</span> <span class="n">word_dict</span>
  734. <span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Dict</span><span class="p">(</span>
  735. <span class="p">{</span>
  736. <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">env</span><span class="o">.</span><span class="n">observation_space</span><span class="p">[</span><span class="s2">&quot;image&quot;</span><span class="p">],</span>
  737. <span class="s2">&quot;direction&quot;</span><span class="p">:</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Discrete</span><span class="p">(</span><span class="mi">4</span><span class="p">),</span>
  738. <span class="s2">&quot;mission&quot;</span><span class="p">:</span> <span class="n">spaces</span><span class="o">.</span><span class="n">MultiDiscrete</span><span class="p">(</span>
  739. <span class="p">[</span><span class="nb">len</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">word_dict</span><span class="o">.</span><span class="n">keys</span><span class="p">())]</span> <span class="o">*</span> <span class="n">max_words_in_mission</span>
  740. <span class="p">),</span>
  741. <span class="p">}</span>
  742. <span class="p">)</span>
  743. <span class="nd">@staticmethod</span>
  744. <span class="k">def</span> <span class="nf">get_minigrid_words</span><span class="p">():</span>
  745. <span class="n">colors</span> <span class="o">=</span> <span class="p">[</span><span class="s2">&quot;red&quot;</span><span class="p">,</span> <span class="s2">&quot;green&quot;</span><span class="p">,</span> <span class="s2">&quot;blue&quot;</span><span class="p">,</span> <span class="s2">&quot;yellow&quot;</span><span class="p">,</span> <span class="s2">&quot;purple&quot;</span><span class="p">,</span> <span class="s2">&quot;grey&quot;</span><span class="p">]</span>
  746. <span class="n">objects</span> <span class="o">=</span> <span class="p">[</span>
  747. <span class="s2">&quot;unseen&quot;</span><span class="p">,</span>
  748. <span class="s2">&quot;empty&quot;</span><span class="p">,</span>
  749. <span class="s2">&quot;wall&quot;</span><span class="p">,</span>
  750. <span class="s2">&quot;floor&quot;</span><span class="p">,</span>
  751. <span class="s2">&quot;box&quot;</span><span class="p">,</span>
  752. <span class="s2">&quot;key&quot;</span><span class="p">,</span>
  753. <span class="s2">&quot;ball&quot;</span><span class="p">,</span>
  754. <span class="s2">&quot;door&quot;</span><span class="p">,</span>
  755. <span class="s2">&quot;goal&quot;</span><span class="p">,</span>
  756. <span class="s2">&quot;agent&quot;</span><span class="p">,</span>
  757. <span class="s2">&quot;lava&quot;</span><span class="p">,</span>
  758. <span class="p">]</span>
  759. <span class="n">verbs</span> <span class="o">=</span> <span class="p">[</span>
  760. <span class="s2">&quot;pick&quot;</span><span class="p">,</span>
  761. <span class="s2">&quot;avoid&quot;</span><span class="p">,</span>
  762. <span class="s2">&quot;get&quot;</span><span class="p">,</span>
  763. <span class="s2">&quot;find&quot;</span><span class="p">,</span>
  764. <span class="s2">&quot;put&quot;</span><span class="p">,</span>
  765. <span class="s2">&quot;use&quot;</span><span class="p">,</span>
  766. <span class="s2">&quot;open&quot;</span><span class="p">,</span>
  767. <span class="s2">&quot;go&quot;</span><span class="p">,</span>
  768. <span class="s2">&quot;fetch&quot;</span><span class="p">,</span>
  769. <span class="s2">&quot;reach&quot;</span><span class="p">,</span>
  770. <span class="s2">&quot;unlock&quot;</span><span class="p">,</span>
  771. <span class="s2">&quot;traverse&quot;</span><span class="p">,</span>
  772. <span class="p">]</span>
  773. <span class="n">extra_words</span> <span class="o">=</span> <span class="p">[</span>
  774. <span class="s2">&quot;up&quot;</span><span class="p">,</span>
  775. <span class="s2">&quot;the&quot;</span><span class="p">,</span>
  776. <span class="s2">&quot;a&quot;</span><span class="p">,</span>
  777. <span class="s2">&quot;at&quot;</span><span class="p">,</span>
  778. <span class="s2">&quot;,&quot;</span><span class="p">,</span>
  779. <span class="s2">&quot;square&quot;</span><span class="p">,</span>
  780. <span class="s2">&quot;and&quot;</span><span class="p">,</span>
  781. <span class="s2">&quot;then&quot;</span><span class="p">,</span>
  782. <span class="s2">&quot;to&quot;</span><span class="p">,</span>
  783. <span class="s2">&quot;of&quot;</span><span class="p">,</span>
  784. <span class="s2">&quot;rooms&quot;</span><span class="p">,</span>
  785. <span class="s2">&quot;near&quot;</span><span class="p">,</span>
  786. <span class="s2">&quot;opening&quot;</span><span class="p">,</span>
  787. <span class="s2">&quot;must&quot;</span><span class="p">,</span>
  788. <span class="s2">&quot;you&quot;</span><span class="p">,</span>
  789. <span class="s2">&quot;matching&quot;</span><span class="p">,</span>
  790. <span class="s2">&quot;end&quot;</span><span class="p">,</span>
  791. <span class="s2">&quot;hallway&quot;</span><span class="p">,</span>
  792. <span class="s2">&quot;object&quot;</span><span class="p">,</span>
  793. <span class="s2">&quot;from&quot;</span><span class="p">,</span>
  794. <span class="s2">&quot;room&quot;</span><span class="p">,</span>
  795. <span class="s2">&quot;maze&quot;</span><span class="p">,</span>
  796. <span class="p">]</span>
  797. <span class="n">all_words</span> <span class="o">=</span> <span class="n">colors</span> <span class="o">+</span> <span class="n">objects</span> <span class="o">+</span> <span class="n">verbs</span> <span class="o">+</span> <span class="n">extra_words</span>
  798. <span class="k">assert</span> <span class="nb">len</span><span class="p">(</span><span class="n">all_words</span><span class="p">)</span> <span class="o">==</span> <span class="nb">len</span><span class="p">(</span><span class="nb">set</span><span class="p">(</span><span class="n">all_words</span><span class="p">))</span>
  799. <span class="k">return</span> <span class="p">{</span><span class="n">word</span><span class="p">:</span> <span class="n">i</span> <span class="k">for</span> <span class="n">i</span><span class="p">,</span> <span class="n">word</span> <span class="ow">in</span> <span class="nb">enumerate</span><span class="p">(</span><span class="n">all_words</span><span class="p">)}</span>
  800. <span class="k">def</span> <span class="nf">string_to_indices</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">string</span><span class="p">,</span> <span class="n">offset</span><span class="o">=</span><span class="mi">1</span><span class="p">):</span>
  801. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  802. <span class="sd"> Convert a string to a list of indices.</span>
  803. <span class="sd"> &quot;&quot;&quot;</span>
  804. <span class="n">indices</span> <span class="o">=</span> <span class="p">[]</span>
  805. <span class="c1"># adding space before and after commas</span>
  806. <span class="n">string</span> <span class="o">=</span> <span class="n">string</span><span class="o">.</span><span class="n">replace</span><span class="p">(</span><span class="s2">&quot;,&quot;</span><span class="p">,</span> <span class="s2">&quot; , &quot;</span><span class="p">)</span>
  807. <span class="k">for</span> <span class="n">word</span> <span class="ow">in</span> <span class="n">string</span><span class="o">.</span><span class="n">split</span><span class="p">():</span>
  808. <span class="k">if</span> <span class="n">word</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">word_dict</span><span class="o">.</span><span class="n">keys</span><span class="p">():</span>
  809. <span class="n">indices</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">word_dict</span><span class="p">[</span><span class="n">word</span><span class="p">]</span> <span class="o">+</span> <span class="n">offset</span><span class="p">)</span>
  810. <span class="k">else</span><span class="p">:</span>
  811. <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="sa">f</span><span class="s2">&quot;Unknown word: </span><span class="si">{</span><span class="n">word</span><span class="si">}</span><span class="s2">&quot;</span><span class="p">)</span>
  812. <span class="k">return</span> <span class="n">indices</span>
  813. <span class="k">def</span> <span class="nf">observation</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">obs</span><span class="p">):</span>
  814. <span class="n">obs</span><span class="p">[</span><span class="s2">&quot;mission&quot;</span><span class="p">]</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">string_to_indices</span><span class="p">(</span><span class="n">obs</span><span class="p">[</span><span class="s2">&quot;mission&quot;</span><span class="p">])</span>
  815. <span class="k">assert</span> <span class="nb">len</span><span class="p">(</span><span class="n">obs</span><span class="p">[</span><span class="s2">&quot;mission&quot;</span><span class="p">])</span> <span class="o">&lt;</span> <span class="bp">self</span><span class="o">.</span><span class="n">max_words_in_mission</span>
  816. <span class="n">obs</span><span class="p">[</span><span class="s2">&quot;mission&quot;</span><span class="p">]</span> <span class="o">+=</span> <span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">*</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">max_words_in_mission</span> <span class="o">-</span> <span class="nb">len</span><span class="p">(</span><span class="n">obs</span><span class="p">[</span><span class="s2">&quot;mission&quot;</span><span class="p">]))</span>
  817. <span class="k">return</span> <span class="n">obs</span></div>
  818. <div class="viewcode-block" id="FlatObsWrapper">
  819. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.FlatObsWrapper">[docs]</a>
  820. <span class="k">class</span> <span class="nc">FlatObsWrapper</span><span class="p">(</span><span class="n">ObservationWrapper</span><span class="p">):</span>
  821. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  822. <span class="sd"> Encode mission strings using a one-hot scheme,</span>
  823. <span class="sd"> and combine these with observed images into one flat array.</span>
  824. <span class="sd"> This wrapper is not applicable to BabyAI environments, given that these have their own language component.</span>
  825. <span class="sd"> Example:</span>
  826. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  827. <span class="sd"> &gt;&gt;&gt; import matplotlib.pyplot as plt</span>
  828. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import FlatObsWrapper</span>
  829. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-LavaCrossingS11N5-v0&quot;)</span>
  830. <span class="sd"> &gt;&gt;&gt; env_obs = FlatObsWrapper(env)</span>
  831. <span class="sd"> &gt;&gt;&gt; obs, _ = env_obs.reset()</span>
  832. <span class="sd"> &gt;&gt;&gt; obs.shape</span>
  833. <span class="sd"> (2835,)</span>
  834. <span class="sd"> &quot;&quot;&quot;</span>
  835. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">,</span> <span class="n">maxStrLen</span><span class="o">=</span><span class="mi">96</span><span class="p">):</span>
  836. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  837. <span class="bp">self</span><span class="o">.</span><span class="n">maxStrLen</span> <span class="o">=</span> <span class="n">maxStrLen</span>
  838. <span class="bp">self</span><span class="o">.</span><span class="n">numCharCodes</span> <span class="o">=</span> <span class="mi">28</span>
  839. <span class="n">imgSpace</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">observation_space</span><span class="o">.</span><span class="n">spaces</span><span class="p">[</span><span class="s2">&quot;image&quot;</span><span class="p">]</span>
  840. <span class="n">imgSize</span> <span class="o">=</span> <span class="n">reduce</span><span class="p">(</span><span class="n">operator</span><span class="o">.</span><span class="n">mul</span><span class="p">,</span> <span class="n">imgSpace</span><span class="o">.</span><span class="n">shape</span><span class="p">,</span> <span class="mi">1</span><span class="p">)</span>
  841. <span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Box</span><span class="p">(</span>
  842. <span class="n">low</span><span class="o">=</span><span class="mi">0</span><span class="p">,</span>
  843. <span class="n">high</span><span class="o">=</span><span class="mi">255</span><span class="p">,</span>
  844. <span class="n">shape</span><span class="o">=</span><span class="p">(</span><span class="n">imgSize</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">numCharCodes</span> <span class="o">*</span> <span class="bp">self</span><span class="o">.</span><span class="n">maxStrLen</span><span class="p">,),</span>
  845. <span class="n">dtype</span><span class="o">=</span><span class="s2">&quot;uint8&quot;</span><span class="p">,</span>
  846. <span class="p">)</span>
  847. <span class="bp">self</span><span class="o">.</span><span class="n">cachedStr</span><span class="p">:</span> <span class="nb">str</span> <span class="o">=</span> <span class="kc">None</span>
  848. <span class="k">def</span> <span class="nf">observation</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">obs</span><span class="p">):</span>
  849. <span class="n">image</span> <span class="o">=</span> <span class="n">obs</span><span class="p">[</span><span class="s2">&quot;image&quot;</span><span class="p">]</span>
  850. <span class="n">mission</span> <span class="o">=</span> <span class="n">obs</span><span class="p">[</span><span class="s2">&quot;mission&quot;</span><span class="p">]</span>
  851. <span class="c1"># Cache the last-encoded mission string</span>
  852. <span class="k">if</span> <span class="n">mission</span> <span class="o">!=</span> <span class="bp">self</span><span class="o">.</span><span class="n">cachedStr</span><span class="p">:</span>
  853. <span class="k">assert</span> <span class="p">(</span>
  854. <span class="nb">len</span><span class="p">(</span><span class="n">mission</span><span class="p">)</span> <span class="o">&lt;=</span> <span class="bp">self</span><span class="o">.</span><span class="n">maxStrLen</span>
  855. <span class="p">),</span> <span class="sa">f</span><span class="s2">&quot;mission string too long (</span><span class="si">{</span><span class="nb">len</span><span class="p">(</span><span class="n">mission</span><span class="p">)</span><span class="si">}</span><span class="s2"> chars)&quot;</span>
  856. <span class="n">mission</span> <span class="o">=</span> <span class="n">mission</span><span class="o">.</span><span class="n">lower</span><span class="p">()</span>
  857. <span class="n">strArray</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">zeros</span><span class="p">(</span>
  858. <span class="n">shape</span><span class="o">=</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">maxStrLen</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">numCharCodes</span><span class="p">),</span> <span class="n">dtype</span><span class="o">=</span><span class="s2">&quot;float32&quot;</span>
  859. <span class="p">)</span>
  860. <span class="k">for</span> <span class="n">idx</span><span class="p">,</span> <span class="n">ch</span> <span class="ow">in</span> <span class="nb">enumerate</span><span class="p">(</span><span class="n">mission</span><span class="p">):</span>
  861. <span class="k">if</span> <span class="n">ch</span> <span class="o">&gt;=</span> <span class="s2">&quot;a&quot;</span> <span class="ow">and</span> <span class="n">ch</span> <span class="o">&lt;=</span> <span class="s2">&quot;z&quot;</span><span class="p">:</span>
  862. <span class="n">chNo</span> <span class="o">=</span> <span class="nb">ord</span><span class="p">(</span><span class="n">ch</span><span class="p">)</span> <span class="o">-</span> <span class="nb">ord</span><span class="p">(</span><span class="s2">&quot;a&quot;</span><span class="p">)</span>
  863. <span class="k">elif</span> <span class="n">ch</span> <span class="o">==</span> <span class="s2">&quot; &quot;</span><span class="p">:</span>
  864. <span class="n">chNo</span> <span class="o">=</span> <span class="nb">ord</span><span class="p">(</span><span class="s2">&quot;z&quot;</span><span class="p">)</span> <span class="o">-</span> <span class="nb">ord</span><span class="p">(</span><span class="s2">&quot;a&quot;</span><span class="p">)</span> <span class="o">+</span> <span class="mi">1</span>
  865. <span class="k">elif</span> <span class="n">ch</span> <span class="o">==</span> <span class="s2">&quot;,&quot;</span><span class="p">:</span>
  866. <span class="n">chNo</span> <span class="o">=</span> <span class="nb">ord</span><span class="p">(</span><span class="s2">&quot;z&quot;</span><span class="p">)</span> <span class="o">-</span> <span class="nb">ord</span><span class="p">(</span><span class="s2">&quot;a&quot;</span><span class="p">)</span> <span class="o">+</span> <span class="mi">2</span>
  867. <span class="k">else</span><span class="p">:</span>
  868. <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span>
  869. <span class="sa">f</span><span class="s2">&quot;Character </span><span class="si">{</span><span class="n">ch</span><span class="si">}</span><span class="s2"> is not available in mission string.&quot;</span>
  870. <span class="p">)</span>
  871. <span class="k">assert</span> <span class="n">chNo</span> <span class="o">&lt;</span> <span class="bp">self</span><span class="o">.</span><span class="n">numCharCodes</span><span class="p">,</span> <span class="s2">&quot;</span><span class="si">%s</span><span class="s2"> : </span><span class="si">%d</span><span class="s2">&quot;</span> <span class="o">%</span> <span class="p">(</span><span class="n">ch</span><span class="p">,</span> <span class="n">chNo</span><span class="p">)</span>
  872. <span class="n">strArray</span><span class="p">[</span><span class="n">idx</span><span class="p">,</span> <span class="n">chNo</span><span class="p">]</span> <span class="o">=</span> <span class="mi">1</span>
  873. <span class="bp">self</span><span class="o">.</span><span class="n">cachedStr</span> <span class="o">=</span> <span class="n">mission</span>
  874. <span class="bp">self</span><span class="o">.</span><span class="n">cachedArray</span> <span class="o">=</span> <span class="n">strArray</span>
  875. <span class="n">obs</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">concatenate</span><span class="p">((</span><span class="n">image</span><span class="o">.</span><span class="n">flatten</span><span class="p">(),</span> <span class="bp">self</span><span class="o">.</span><span class="n">cachedArray</span><span class="o">.</span><span class="n">flatten</span><span class="p">()))</span>
  876. <span class="k">return</span> <span class="n">obs</span></div>
  877. <div class="viewcode-block" id="ViewSizeWrapper">
  878. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.ViewSizeWrapper">[docs]</a>
  879. <span class="k">class</span> <span class="nc">ViewSizeWrapper</span><span class="p">(</span><span class="n">ObservationWrapper</span><span class="p">):</span>
  880. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  881. <span class="sd"> Wrapper to customize the agent field of view size.</span>
  882. <span class="sd"> This cannot be used with fully observable wrappers.</span>
  883. <span class="sd"> Example:</span>
  884. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  885. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import ViewSizeWrapper</span>
  886. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-LavaCrossingS11N5-v0&quot;)</span>
  887. <span class="sd"> &gt;&gt;&gt; obs, _ = env.reset()</span>
  888. <span class="sd"> &gt;&gt;&gt; obs[&#39;image&#39;].shape</span>
  889. <span class="sd"> (7, 7, 3)</span>
  890. <span class="sd"> &gt;&gt;&gt; env_obs = ViewSizeWrapper(env, agent_view_size=5)</span>
  891. <span class="sd"> &gt;&gt;&gt; obs, _ = env_obs.reset()</span>
  892. <span class="sd"> &gt;&gt;&gt; obs[&#39;image&#39;].shape</span>
  893. <span class="sd"> (5, 5, 3)</span>
  894. <span class="sd"> &quot;&quot;&quot;</span>
  895. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">,</span> <span class="n">agent_view_size</span><span class="o">=</span><span class="mi">7</span><span class="p">):</span>
  896. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  897. <span class="k">assert</span> <span class="n">agent_view_size</span> <span class="o">%</span> <span class="mi">2</span> <span class="o">==</span> <span class="mi">1</span>
  898. <span class="k">assert</span> <span class="n">agent_view_size</span> <span class="o">&gt;=</span> <span class="mi">3</span>
  899. <span class="bp">self</span><span class="o">.</span><span class="n">agent_view_size</span> <span class="o">=</span> <span class="n">agent_view_size</span>
  900. <span class="c1"># Compute observation space with specified view size</span>
  901. <span class="n">new_image_space</span> <span class="o">=</span> <span class="n">gym</span><span class="o">.</span><span class="n">spaces</span><span class="o">.</span><span class="n">Box</span><span class="p">(</span>
  902. <span class="n">low</span><span class="o">=</span><span class="mi">0</span><span class="p">,</span> <span class="n">high</span><span class="o">=</span><span class="mi">255</span><span class="p">,</span> <span class="n">shape</span><span class="o">=</span><span class="p">(</span><span class="n">agent_view_size</span><span class="p">,</span> <span class="n">agent_view_size</span><span class="p">,</span> <span class="mi">3</span><span class="p">),</span> <span class="n">dtype</span><span class="o">=</span><span class="s2">&quot;uint8&quot;</span>
  903. <span class="p">)</span>
  904. <span class="c1"># Override the environment&#39;s observation spaceexit</span>
  905. <span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Dict</span><span class="p">(</span>
  906. <span class="p">{</span><span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span><span class="o">.</span><span class="n">spaces</span><span class="p">,</span> <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">new_image_space</span><span class="p">}</span>
  907. <span class="p">)</span>
  908. <span class="k">def</span> <span class="nf">observation</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">obs</span><span class="p">):</span>
  909. <span class="n">env</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">unwrapped</span>
  910. <span class="n">grid</span><span class="p">,</span> <span class="n">vis_mask</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">gen_obs_grid</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">agent_view_size</span><span class="p">)</span>
  911. <span class="c1"># Encode the partially observable view into a numpy array</span>
  912. <span class="n">image</span> <span class="o">=</span> <span class="n">grid</span><span class="o">.</span><span class="n">encode</span><span class="p">(</span><span class="n">vis_mask</span><span class="p">)</span>
  913. <span class="k">return</span> <span class="p">{</span><span class="o">**</span><span class="n">obs</span><span class="p">,</span> <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">image</span><span class="p">}</span></div>
  914. <div class="viewcode-block" id="DirectionObsWrapper">
  915. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.DirectionObsWrapper">[docs]</a>
  916. <span class="k">class</span> <span class="nc">DirectionObsWrapper</span><span class="p">(</span><span class="n">ObservationWrapper</span><span class="p">):</span>
  917. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  918. <span class="sd"> Provides the slope/angular direction to the goal with the observations as modeled by (y2 - y2 )/( x2 - x1)</span>
  919. <span class="sd"> type = {slope , angle}</span>
  920. <span class="sd"> Example:</span>
  921. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  922. <span class="sd"> &gt;&gt;&gt; import matplotlib.pyplot as plt</span>
  923. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import DirectionObsWrapper</span>
  924. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-LavaCrossingS11N5-v0&quot;)</span>
  925. <span class="sd"> &gt;&gt;&gt; env_obs = DirectionObsWrapper(env, type=&quot;slope&quot;)</span>
  926. <span class="sd"> &gt;&gt;&gt; obs, _ = env_obs.reset()</span>
  927. <span class="sd"> &gt;&gt;&gt; obs[&#39;goal_direction&#39;]</span>
  928. <span class="sd"> 1.0</span>
  929. <span class="sd"> &quot;&quot;&quot;</span>
  930. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">,</span> <span class="nb">type</span><span class="o">=</span><span class="s2">&quot;slope&quot;</span><span class="p">):</span>
  931. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  932. <span class="bp">self</span><span class="o">.</span><span class="n">goal_position</span><span class="p">:</span> <span class="nb">tuple</span> <span class="o">=</span> <span class="kc">None</span>
  933. <span class="bp">self</span><span class="o">.</span><span class="n">type</span> <span class="o">=</span> <span class="nb">type</span>
  934. <span class="k">def</span> <span class="nf">reset</span><span class="p">(</span>
  935. <span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">seed</span><span class="p">:</span> <span class="nb">int</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">,</span> <span class="n">options</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">]</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span>
  936. <span class="p">)</span> <span class="o">-&gt;</span> <span class="nb">tuple</span><span class="p">[</span><span class="n">ObsType</span><span class="p">,</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">]]:</span>
  937. <span class="n">obs</span><span class="p">,</span> <span class="n">info</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">env</span><span class="o">.</span><span class="n">reset</span><span class="p">()</span>
  938. <span class="k">if</span> <span class="ow">not</span> <span class="bp">self</span><span class="o">.</span><span class="n">goal_position</span><span class="p">:</span>
  939. <span class="bp">self</span><span class="o">.</span><span class="n">goal_position</span> <span class="o">=</span> <span class="p">[</span>
  940. <span class="n">x</span> <span class="k">for</span> <span class="n">x</span><span class="p">,</span> <span class="n">y</span> <span class="ow">in</span> <span class="nb">enumerate</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">grid</span><span class="o">.</span><span class="n">grid</span><span class="p">)</span> <span class="k">if</span> <span class="nb">isinstance</span><span class="p">(</span><span class="n">y</span><span class="p">,</span> <span class="n">Goal</span><span class="p">)</span>
  941. <span class="p">]</span>
  942. <span class="c1"># in case there are multiple goals , needs to be handled for other env types</span>
  943. <span class="k">if</span> <span class="nb">len</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">goal_position</span><span class="p">)</span> <span class="o">&gt;=</span> <span class="mi">1</span><span class="p">:</span>
  944. <span class="bp">self</span><span class="o">.</span><span class="n">goal_position</span> <span class="o">=</span> <span class="p">(</span>
  945. <span class="nb">int</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">goal_position</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">/</span> <span class="bp">self</span><span class="o">.</span><span class="n">height</span><span class="p">),</span>
  946. <span class="bp">self</span><span class="o">.</span><span class="n">goal_position</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">%</span> <span class="bp">self</span><span class="o">.</span><span class="n">width</span><span class="p">,</span>
  947. <span class="p">)</span>
  948. <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">observation</span><span class="p">(</span><span class="n">obs</span><span class="p">),</span> <span class="n">info</span>
  949. <span class="k">def</span> <span class="nf">observation</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">obs</span><span class="p">):</span>
  950. <span class="n">slope</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">divide</span><span class="p">(</span>
  951. <span class="bp">self</span><span class="o">.</span><span class="n">goal_position</span><span class="p">[</span><span class="mi">1</span><span class="p">]</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">agent_pos</span><span class="p">[</span><span class="mi">1</span><span class="p">],</span>
  952. <span class="bp">self</span><span class="o">.</span><span class="n">goal_position</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">agent_pos</span><span class="p">[</span><span class="mi">0</span><span class="p">],</span>
  953. <span class="p">)</span>
  954. <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">type</span> <span class="o">==</span> <span class="s2">&quot;angle&quot;</span><span class="p">:</span>
  955. <span class="n">obs</span><span class="p">[</span><span class="s2">&quot;goal_direction&quot;</span><span class="p">]</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">arctan</span><span class="p">(</span><span class="n">slope</span><span class="p">)</span>
  956. <span class="k">else</span><span class="p">:</span>
  957. <span class="n">obs</span><span class="p">[</span><span class="s2">&quot;goal_direction&quot;</span><span class="p">]</span> <span class="o">=</span> <span class="n">slope</span>
  958. <span class="k">return</span> <span class="n">obs</span></div>
  959. <div class="viewcode-block" id="SymbolicObsWrapper">
  960. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.SymbolicObsWrapper">[docs]</a>
  961. <span class="k">class</span> <span class="nc">SymbolicObsWrapper</span><span class="p">(</span><span class="n">ObservationWrapper</span><span class="p">):</span>
  962. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  963. <span class="sd"> Fully observable grid with a symbolic state representation.</span>
  964. <span class="sd"> The symbol is a triple of (X, Y, IDX), where X and Y are</span>
  965. <span class="sd"> the coordinates on the grid, and IDX is the id of the object.</span>
  966. <span class="sd"> Example:</span>
  967. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  968. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import SymbolicObsWrapper</span>
  969. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-LavaCrossingS11N5-v0&quot;)</span>
  970. <span class="sd"> &gt;&gt;&gt; obs, _ = env.reset()</span>
  971. <span class="sd"> &gt;&gt;&gt; obs[&#39;image&#39;].shape</span>
  972. <span class="sd"> (7, 7, 3)</span>
  973. <span class="sd"> &gt;&gt;&gt; env_obs = SymbolicObsWrapper(env)</span>
  974. <span class="sd"> &gt;&gt;&gt; obs, _ = env_obs.reset()</span>
  975. <span class="sd"> &gt;&gt;&gt; obs[&#39;image&#39;].shape</span>
  976. <span class="sd"> (11, 11, 3)</span>
  977. <span class="sd"> &quot;&quot;&quot;</span>
  978. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">):</span>
  979. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  980. <span class="n">new_image_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Box</span><span class="p">(</span>
  981. <span class="n">low</span><span class="o">=</span><span class="mi">0</span><span class="p">,</span>
  982. <span class="n">high</span><span class="o">=</span><span class="nb">max</span><span class="p">(</span><span class="n">OBJECT_TO_IDX</span><span class="o">.</span><span class="n">values</span><span class="p">()),</span>
  983. <span class="n">shape</span><span class="o">=</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">env</span><span class="o">.</span><span class="n">width</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">env</span><span class="o">.</span><span class="n">height</span><span class="p">,</span> <span class="mi">3</span><span class="p">),</span> <span class="c1"># number of cells</span>
  984. <span class="n">dtype</span><span class="o">=</span><span class="s2">&quot;uint8&quot;</span><span class="p">,</span>
  985. <span class="p">)</span>
  986. <span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span> <span class="o">=</span> <span class="n">spaces</span><span class="o">.</span><span class="n">Dict</span><span class="p">(</span>
  987. <span class="p">{</span><span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">observation_space</span><span class="o">.</span><span class="n">spaces</span><span class="p">,</span> <span class="s2">&quot;image&quot;</span><span class="p">:</span> <span class="n">new_image_space</span><span class="p">}</span>
  988. <span class="p">)</span>
  989. <span class="k">def</span> <span class="nf">observation</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">obs</span><span class="p">):</span>
  990. <span class="n">objects</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">(</span>
  991. <span class="p">[</span><span class="n">OBJECT_TO_IDX</span><span class="p">[</span><span class="n">o</span><span class="o">.</span><span class="n">type</span><span class="p">]</span> <span class="k">if</span> <span class="n">o</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="k">else</span> <span class="o">-</span><span class="mi">1</span> <span class="k">for</span> <span class="n">o</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">grid</span><span class="o">.</span><span class="n">grid</span><span class="p">]</span>
  992. <span class="p">)</span>
  993. <span class="n">agent_pos</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">env</span><span class="o">.</span><span class="n">agent_pos</span>
  994. <span class="n">ncol</span><span class="p">,</span> <span class="n">nrow</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">width</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">height</span>
  995. <span class="n">grid</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">mgrid</span><span class="p">[:</span><span class="n">ncol</span><span class="p">,</span> <span class="p">:</span><span class="n">nrow</span><span class="p">]</span>
  996. <span class="n">_objects</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">transpose</span><span class="p">(</span><span class="n">objects</span><span class="o">.</span><span class="n">reshape</span><span class="p">(</span><span class="mi">1</span><span class="p">,</span> <span class="n">nrow</span><span class="p">,</span> <span class="n">ncol</span><span class="p">),</span> <span class="p">(</span><span class="mi">0</span><span class="p">,</span> <span class="mi">2</span><span class="p">,</span> <span class="mi">1</span><span class="p">))</span>
  997. <span class="n">grid</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">concatenate</span><span class="p">([</span><span class="n">grid</span><span class="p">,</span> <span class="n">_objects</span><span class="p">])</span>
  998. <span class="n">grid</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">transpose</span><span class="p">(</span><span class="n">grid</span><span class="p">,</span> <span class="p">(</span><span class="mi">1</span><span class="p">,</span> <span class="mi">2</span><span class="p">,</span> <span class="mi">0</span><span class="p">))</span>
  999. <span class="n">grid</span><span class="p">[</span><span class="n">agent_pos</span><span class="p">[</span><span class="mi">0</span><span class="p">],</span> <span class="n">agent_pos</span><span class="p">[</span><span class="mi">1</span><span class="p">],</span> <span class="mi">2</span><span class="p">]</span> <span class="o">=</span> <span class="n">OBJECT_TO_IDX</span><span class="p">[</span><span class="s2">&quot;agent&quot;</span><span class="p">]</span>
  1000. <span class="n">obs</span><span class="p">[</span><span class="s2">&quot;image&quot;</span><span class="p">]</span> <span class="o">=</span> <span class="n">grid</span>
  1001. <span class="k">return</span> <span class="n">obs</span></div>
  1002. <div class="viewcode-block" id="StochasticActionWrapper">
  1003. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.StochasticActionWrapper">[docs]</a>
  1004. <span class="k">class</span> <span class="nc">StochasticActionWrapper</span><span class="p">(</span><span class="n">ActionWrapper</span><span class="p">):</span>
  1005. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  1006. <span class="sd"> Add stochasticity to the actions</span>
  1007. <span class="sd"> If a random action is provided, it is returned with probability `1 - prob`.</span>
  1008. <span class="sd"> Else, a random action is sampled from the action space.</span>
  1009. <span class="sd"> &quot;&quot;&quot;</span>
  1010. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="o">=</span><span class="kc">None</span><span class="p">,</span> <span class="n">prob</span><span class="o">=</span><span class="mf">0.9</span><span class="p">,</span> <span class="n">random_action</span><span class="o">=</span><span class="kc">None</span><span class="p">):</span>
  1011. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  1012. <span class="bp">self</span><span class="o">.</span><span class="n">prob</span> <span class="o">=</span> <span class="n">prob</span>
  1013. <span class="bp">self</span><span class="o">.</span><span class="n">random_action</span> <span class="o">=</span> <span class="n">random_action</span>
  1014. <span class="k">def</span> <span class="nf">action</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">action</span><span class="p">):</span>
  1015. <span class="w"> </span><span class="sd">&quot;&quot;&quot; &quot;&quot;&quot;</span>
  1016. <span class="k">if</span> <span class="n">np</span><span class="o">.</span><span class="n">random</span><span class="o">.</span><span class="n">uniform</span><span class="p">()</span> <span class="o">&lt;</span> <span class="bp">self</span><span class="o">.</span><span class="n">prob</span><span class="p">:</span>
  1017. <span class="k">return</span> <span class="n">action</span>
  1018. <span class="k">else</span><span class="p">:</span>
  1019. <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">random_action</span> <span class="ow">is</span> <span class="kc">None</span><span class="p">:</span>
  1020. <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">np_random</span><span class="o">.</span><span class="n">integers</span><span class="p">(</span><span class="mi">0</span><span class="p">,</span> <span class="n">high</span><span class="o">=</span><span class="mi">6</span><span class="p">)</span>
  1021. <span class="k">else</span><span class="p">:</span>
  1022. <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">random_action</span></div>
  1023. <div class="viewcode-block" id="NoDeath">
  1024. <a class="viewcode-back" href="../../../api/wrappers/#minigrid.wrappers.NoDeath">[docs]</a>
  1025. <span class="k">class</span> <span class="nc">NoDeath</span><span class="p">(</span><span class="n">Wrapper</span><span class="p">):</span>
  1026. <span class="w"> </span><span class="sd">&quot;&quot;&quot;</span>
  1027. <span class="sd"> Wrapper to prevent death in specific cells (e.g., lava cells).</span>
  1028. <span class="sd"> Instead of dying, the agent will receive a negative reward.</span>
  1029. <span class="sd"> Example:</span>
  1030. <span class="sd"> &gt;&gt;&gt; import gymnasium as gym</span>
  1031. <span class="sd"> &gt;&gt;&gt; from minigrid.wrappers import NoDeath</span>
  1032. <span class="sd"> &gt;&gt;&gt;</span>
  1033. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-LavaCrossingS9N1-v0&quot;)</span>
  1034. <span class="sd"> &gt;&gt;&gt; _, _ = env.reset(seed=2)</span>
  1035. <span class="sd"> &gt;&gt;&gt; _, _, _, _, _ = env.step(1)</span>
  1036. <span class="sd"> &gt;&gt;&gt; _, reward, term, *_ = env.step(2)</span>
  1037. <span class="sd"> &gt;&gt;&gt; reward, term</span>
  1038. <span class="sd"> (0, True)</span>
  1039. <span class="sd"> &gt;&gt;&gt;</span>
  1040. <span class="sd"> &gt;&gt;&gt; env = NoDeath(env, no_death_types=(&quot;lava&quot;,), death_cost=-1.0)</span>
  1041. <span class="sd"> &gt;&gt;&gt; _, _ = env.reset(seed=2)</span>
  1042. <span class="sd"> &gt;&gt;&gt; _, _, _, _, _ = env.step(1)</span>
  1043. <span class="sd"> &gt;&gt;&gt; _, reward, term, *_ = env.step(2)</span>
  1044. <span class="sd"> &gt;&gt;&gt; reward, term</span>
  1045. <span class="sd"> (-1.0, False)</span>
  1046. <span class="sd"> &gt;&gt;&gt;</span>
  1047. <span class="sd"> &gt;&gt;&gt;</span>
  1048. <span class="sd"> &gt;&gt;&gt; env = gym.make(&quot;MiniGrid-Dynamic-Obstacles-5x5-v0&quot;)</span>
  1049. <span class="sd"> &gt;&gt;&gt; _, _ = env.reset(seed=2)</span>
  1050. <span class="sd"> &gt;&gt;&gt; _, reward, term, *_ = env.step(2)</span>
  1051. <span class="sd"> &gt;&gt;&gt; reward, term</span>
  1052. <span class="sd"> (-1, True)</span>
  1053. <span class="sd"> &gt;&gt;&gt;</span>
  1054. <span class="sd"> &gt;&gt;&gt; env = NoDeath(env, no_death_types=(&quot;ball&quot;,), death_cost=-1.0)</span>
  1055. <span class="sd"> &gt;&gt;&gt; _, _ = env.reset(seed=2)</span>
  1056. <span class="sd"> &gt;&gt;&gt; _, reward, term, *_ = env.step(2)</span>
  1057. <span class="sd"> &gt;&gt;&gt; reward, term</span>
  1058. <span class="sd"> (-2.0, False)</span>
  1059. <span class="sd"> &quot;&quot;&quot;</span>
  1060. <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">,</span> <span class="n">no_death_types</span><span class="p">:</span> <span class="nb">tuple</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="o">...</span><span class="p">],</span> <span class="n">death_cost</span><span class="p">:</span> <span class="nb">float</span> <span class="o">=</span> <span class="o">-</span><span class="mf">1.0</span><span class="p">):</span>
  1061. <span class="w"> </span><span class="sd">&quot;&quot;&quot;A wrapper to prevent death in specific cells.</span>
  1062. <span class="sd"> Args:</span>
  1063. <span class="sd"> env: The environment to apply the wrapper</span>
  1064. <span class="sd"> no_death_types: List of strings to identify death cells</span>
  1065. <span class="sd"> death_cost: The negative reward received in death cells</span>
  1066. <span class="sd"> &quot;&quot;&quot;</span>
  1067. <span class="k">assert</span> <span class="s2">&quot;goal&quot;</span> <span class="ow">not</span> <span class="ow">in</span> <span class="n">no_death_types</span><span class="p">,</span> <span class="s2">&quot;goal cannot be a death cell&quot;</span>
  1068. <span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
  1069. <span class="bp">self</span><span class="o">.</span><span class="n">death_cost</span> <span class="o">=</span> <span class="n">death_cost</span>
  1070. <span class="bp">self</span><span class="o">.</span><span class="n">no_death_types</span> <span class="o">=</span> <span class="n">no_death_types</span>
  1071. <span class="k">def</span> <span class="nf">step</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">action</span><span class="p">):</span>
  1072. <span class="c1"># In Dynamic-Obstacles, obstacles move after the agent moves,</span>
  1073. <span class="c1"># so we need to check for collision before self.env.step()</span>
  1074. <span class="n">front_cell</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">grid</span><span class="o">.</span><span class="n">get</span><span class="p">(</span><span class="o">*</span><span class="bp">self</span><span class="o">.</span><span class="n">front_pos</span><span class="p">)</span>
  1075. <span class="n">going_to_death</span> <span class="o">=</span> <span class="p">(</span>
  1076. <span class="n">action</span> <span class="o">==</span> <span class="bp">self</span><span class="o">.</span><span class="n">actions</span><span class="o">.</span><span class="n">forward</span>
  1077. <span class="ow">and</span> <span class="n">front_cell</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
  1078. <span class="ow">and</span> <span class="n">front_cell</span><span class="o">.</span><span class="n">type</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">no_death_types</span>
  1079. <span class="p">)</span>
  1080. <span class="n">obs</span><span class="p">,</span> <span class="n">reward</span><span class="p">,</span> <span class="n">terminated</span><span class="p">,</span> <span class="n">truncated</span><span class="p">,</span> <span class="n">info</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">env</span><span class="o">.</span><span class="n">step</span><span class="p">(</span><span class="n">action</span><span class="p">)</span>
  1081. <span class="c1"># We also check if the agent stays in death cells (e.g., lava)</span>
  1082. <span class="c1"># without moving</span>
  1083. <span class="n">current_cell</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">grid</span><span class="o">.</span><span class="n">get</span><span class="p">(</span><span class="o">*</span><span class="bp">self</span><span class="o">.</span><span class="n">agent_pos</span><span class="p">)</span>
  1084. <span class="n">in_death</span> <span class="o">=</span> <span class="n">current_cell</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="ow">and</span> <span class="n">current_cell</span><span class="o">.</span><span class="n">type</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">no_death_types</span>
  1085. <span class="k">if</span> <span class="n">terminated</span> <span class="ow">and</span> <span class="p">(</span><span class="n">going_to_death</span> <span class="ow">or</span> <span class="n">in_death</span><span class="p">):</span>
  1086. <span class="n">terminated</span> <span class="o">=</span> <span class="kc">False</span>
  1087. <span class="n">reward</span> <span class="o">+=</span> <span class="bp">self</span><span class="o">.</span><span class="n">death_cost</span>
  1088. <span class="k">return</span> <span class="n">obs</span><span class="p">,</span> <span class="n">reward</span><span class="p">,</span> <span class="n">terminated</span><span class="p">,</span> <span class="n">truncated</span><span class="p">,</span> <span class="n">info</span></div>
  1089. </pre></div>
  1090. </article>
  1091. </div>
  1092. <footer>
  1093. <div class="related-pages">
  1094. </div>
  1095. <div class="bottom-of-page">
  1096. <div class="left-details">
  1097. <div class="copyright">
  1098. Copyright &#169; 2023 Farama Foundation
  1099. </div>
  1100. <!--
  1101. Made with <a href="https://www.sphinx-doc.org/">Sphinx</a> and <a class="muted-link" href="https://pradyunsg.me">@pradyunsg</a>'s
  1102. <a href="https://github.com/pradyunsg/furo">Furo</a>
  1103. -->
  1104. </div>
  1105. <div class="right-details">
  1106. <div class="icons">
  1107. <a class="muted-link" href="https://github.com/Farama-Foundation/Minigrid/"
  1108. aria-label="On GitHub">
  1109. <svg stroke="currentColor" fill="currentColor" stroke-width="0" viewBox="0 0 16 16">
  1110. <path fill-rule="evenodd"
  1111. d="M8 0C3.58 0 0 3.58 0 8c0 3.54 2.29 6.53 5.47 7.59.4.07.55-.17.55-.38 0-.19-.01-.82-.01-1.49-2.01.37-2.53-.49-2.69-.94-.09-.23-.48-.94-.82-1.13-.28-.15-.68-.52-.01-.53.63-.01 1.08.58 1.23.82.72 1.21 1.87.87 2.33.66.07-.52.28-.87.51-1.07-1.78-.2-3.64-.89-3.64-3.95 0-.87.31-1.59.82-2.15-.08-.2-.36-1.02.08-2.12 0 0 .67-.21 2.2.82.64-.18 1.32-.27 2-.27.68 0 1.36.09 2 .27 1.53-1.04 2.2-.82 2.2-.82.44 1.1.16 1.92.08 2.12.51.56.82 1.27.82 2.15 0 3.07-1.87 3.75-3.65 3.95.29.25.54.73.54 1.48 0 1.07-.01 1.93-.01 2.2 0 .21.15.46.55.38A8.013 8.013 0 0 0 16 8c0-4.42-3.58-8-8-8z">
  1112. </path>
  1113. </svg>
  1114. </a>
  1115. </div>
  1116. </div>
  1117. </div>
  1118. </footer>
  1119. </div>
  1120. <aside class="toc-drawer no-toc">
  1121. </aside>
  1122. </div>
  1123. </div>
  1124. </div>
  1125. <script>
  1126. const toggleMenu = () => {
  1127. const menuBtn = document.querySelector(".farama-header-menu__btn");
  1128. const menuContainer = document.querySelector(".farama-header-menu-container");
  1129. if (document.querySelector(".farama-header-menu").classList.contains("active")) {
  1130. menuBtn.setAttribute("aria-expanded", "false");
  1131. menuContainer.setAttribute("aria-hidden", "true");
  1132. } else {
  1133. menuBtn.setAttribute("aria-expanded", "true");
  1134. menuContainer.setAttribute("aria-hidden", "false");
  1135. }
  1136. document.querySelector(".farama-header-menu").classList.toggle("active");
  1137. }
  1138. document.querySelector(".farama-header-menu__btn").addEventListener("click", toggleMenu);
  1139. document.getElementById("farama-close-menu").addEventListener("click", toggleMenu);
  1140. </script>
  1141. <script async src="https://www.googletagmanager.com/gtag/js?id=G-FBXJQQLXKD"></script>
  1142. <script>
  1143. const enableGtag = () => {
  1144. window.dataLayer = window.dataLayer || [];
  1145. function gtag(){dataLayer.push(arguments);}
  1146. gtag('js', new Date());
  1147. gtag('config', 'G-FBXJQQLXKD');
  1148. }
  1149. (() => {
  1150. if (!localStorage.getItem("acceptedCookieAlert")) {
  1151. const boxElem = document.createElement("div");
  1152. boxElem.classList.add("cookie-alert");
  1153. const containerElem = document.createElement("div");
  1154. containerElem.classList.add("cookie-alert__container");
  1155. const textElem = document.createElement("p");
  1156. textElem.innerHTML = `This page uses <a href="https://analytics.google.com/">
  1157. Google Analytics</a> to collect statistics.`;
  1158. containerElem.appendChild(textElem);
  1159. const declineBtn = Object.assign(document.createElement("button"),
  1160. {
  1161. innerText: "Deny",
  1162. className: "farama-btn cookie-alert__button",
  1163. id: "cookie-alert__decline",
  1164. }
  1165. );
  1166. declineBtn.addEventListener("click", () => {
  1167. localStorage.setItem("acceptedCookieAlert", false);
  1168. boxElem.remove();
  1169. });
  1170. const acceptBtn = Object.assign(document.createElement("button"),
  1171. {
  1172. innerText: "Allow",
  1173. className: "farama-btn cookie-alert__button",
  1174. id: "cookie-alert__accept",
  1175. }
  1176. );
  1177. acceptBtn.addEventListener("click", () => {
  1178. localStorage.setItem("acceptedCookieAlert", true);
  1179. boxElem.remove();
  1180. enableGtag();
  1181. });
  1182. containerElem.appendChild(declineBtn);
  1183. containerElem.appendChild(acceptBtn);
  1184. boxElem.appendChild(containerElem);
  1185. document.body.appendChild(boxElem);
  1186. } else if (localStorage.getItem("acceptedCookieAlert") === "true") {
  1187. enableGtag();
  1188. }
  1189. })()
  1190. </script>
  1191. <script src="../../../_static/documentation_options.js?v=7fa42598"></script>
  1192. <script src="../../../_static/doctools.js?v=888ff710"></script>
  1193. <script src="../../../_static/sphinx_highlight.js?v=dc90522c"></script>
  1194. <script src="../../../_static/scripts/furo.js?v=7660844c"></script>
  1195. <script>
  1196. const createProjectsList = (projects, displayImages) => {
  1197. const ulElem = Object.assign(document.createElement('ul'),
  1198. {
  1199. className:'farama-header-menu-list',
  1200. }
  1201. )
  1202. for (let project of projects) {
  1203. const liElem = document.createElement("li");
  1204. const aElem = Object.assign(document.createElement("a"),
  1205. {
  1206. href: project.link
  1207. }
  1208. );
  1209. liElem.appendChild(aElem);
  1210. if (displayImages) {
  1211. const imgElem = Object.assign(document.createElement("img"),
  1212. {
  1213. src: project.image ? imagesBasepath + project.image : imagesBasepath + "/farama_black.svg",
  1214. alt: `${project.name} logo`,
  1215. className: "farama-black-logo-invert"
  1216. }
  1217. );
  1218. aElem.appendChild(imgElem);
  1219. }
  1220. aElem.appendChild(document.createTextNode(project.name));
  1221. ulElem.appendChild(liElem);
  1222. }
  1223. return ulElem;
  1224. }
  1225. // Create menu with Farama projects by using the API at farama.org/api/projects.json
  1226. const createCORSRequest = (method, url) => {
  1227. let xhr = new XMLHttpRequest();
  1228. xhr.responseType = 'json';
  1229. if ("withCredentials" in xhr) {
  1230. xhr.open(method, url, true);
  1231. } else if (typeof XDomainRequest != "undefined") {
  1232. // IE8 & IE9
  1233. xhr = new XDomainRequest();
  1234. xhr.open(method, url);
  1235. } else {
  1236. // CORS not supported.
  1237. xhr = null;
  1238. }
  1239. return xhr;
  1240. };
  1241. const url = 'https://farama.org/api/projects.json';
  1242. const imagesBasepath = "https://farama.org/assets/images"
  1243. const method = 'GET';
  1244. let xhr = createCORSRequest(method, url);
  1245. xhr.onload = () => {
  1246. const jsonResponse = xhr.response;
  1247. const sections = {
  1248. "Core Projects": [],
  1249. "Mature Projects": {
  1250. "Documentation": [],
  1251. "Repositories": [],
  1252. },
  1253. "Incubating Projects": {
  1254. "Documentation": [],
  1255. "Repositories": [],
  1256. },
  1257. "Foundation": [
  1258. {
  1259. name: "About",
  1260. link: "https://farama.org/about"
  1261. },
  1262. {
  1263. name: "Standards",
  1264. link: "https://farama.org/project_standards",
  1265. },
  1266. {
  1267. name: "Donate",
  1268. link: "https://farama.org/donations"
  1269. }
  1270. ]
  1271. }
  1272. // Categorize projects
  1273. Object.keys(jsonResponse).forEach(key => {
  1274. projectJson = jsonResponse[key];
  1275. if (projectJson.website !== null) {
  1276. projectJson.link = projectJson.website;
  1277. } else {
  1278. projectJson.link = projectJson.github;
  1279. }
  1280. if (projectJson.type === "core") {
  1281. sections["Core Projects"].push(projectJson)
  1282. } else if (projectJson.type == "mature") {
  1283. if (projectJson.website !== null) {
  1284. sections["Mature Projects"]["Documentation"].push(projectJson)
  1285. } else {
  1286. sections["Mature Projects"]["Repositories"].push(projectJson)
  1287. }
  1288. } else {
  1289. if (projectJson.website !== null) {
  1290. sections["Incubating Projects"]["Documentation"].push(projectJson)
  1291. } else {
  1292. sections["Incubating Projects"]["Repositories"].push(projectJson)
  1293. }
  1294. }
  1295. })
  1296. const menuContainer = document.querySelector(".farama-header-menu__body");
  1297. Object.keys(sections).forEach((key, i) => {
  1298. const sectionElem = Object.assign(
  1299. document.createElement('div'), {
  1300. className:'farama-header-menu__section',
  1301. }
  1302. )
  1303. sectionElem.appendChild(Object.assign(document.createElement('span'),
  1304. {
  1305. className:'farama-header-menu__section-title' ,
  1306. innerText: key
  1307. }
  1308. ))
  1309. // is not a list
  1310. if (sections[key].constructor !== Array) {
  1311. const subSections = sections[key];
  1312. const subSectionContainerElem = Object.assign(
  1313. document.createElement('div'), {
  1314. className:'farama-header-menu__subsections-container',
  1315. style: 'display: flex'
  1316. }
  1317. )
  1318. Object.keys(subSections).forEach((subKey, i) => {
  1319. const subSectionElem = Object.assign(
  1320. document.createElement('div'), {
  1321. className:'farama-header-menu__subsection',
  1322. }
  1323. )
  1324. subSectionElem.appendChild(Object.assign(document.createElement('span'),
  1325. {
  1326. className:'farama-header-menu__subsection-title' ,
  1327. innerText: subKey
  1328. }
  1329. ))
  1330. const ulElem = createProjectsList(subSections[subKey], key !== 'Foundation');
  1331. subSectionElem.appendChild(ulElem);
  1332. subSectionContainerElem.appendChild(subSectionElem);
  1333. })
  1334. sectionElem.appendChild(subSectionContainerElem);
  1335. } else {
  1336. const projects = sections[key];
  1337. const ulElem = createProjectsList(projects, true);
  1338. sectionElem.appendChild(ulElem);
  1339. }
  1340. menuContainer.appendChild(sectionElem)
  1341. });
  1342. }
  1343. xhr.onerror = function() {
  1344. console.error("Unable to load projects");
  1345. };
  1346. xhr.send();
  1347. </script>
  1348. <script>
  1349. const versioningConfig = {
  1350. githubUser: 'Farama-Foundation',
  1351. githubRepo: 'Minigrid',
  1352. };
  1353. fetch('/main/_static/versioning/versioning_menu.html').then(response => {
  1354. if (response.status === 200) {
  1355. response.text().then(text => {
  1356. const container = document.createElement("div");
  1357. container.innerHTML = text;
  1358. document.querySelector("body").appendChild(container);
  1359. // innerHtml doenst evaluate scripts, we need to add them dynamically
  1360. Array.from(container.querySelectorAll("script")).forEach(oldScript => {
  1361. const newScript = document.createElement("script");
  1362. Array.from(oldScript.attributes).forEach(attr => newScript.setAttribute(attr.name, attr.value));
  1363. newScript.appendChild(document.createTextNode(oldScript.innerHTML));
  1364. oldScript.parentNode.replaceChild(newScript, oldScript);
  1365. });
  1366. });
  1367. } else {
  1368. console.warn("Unable to load versioning menu", response);
  1369. }
  1370. });
  1371. </script>
  1372. </body>
  1373. </html>