You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
More details about requirements graph can be found in the documentation at [`hcraft.requirements`](https://irll.github.io/HierarchyCraft/hcraft/requirements.html) and example of requirements graph for some HierarchyCraft environements can be found in [`hcraft.examples`](https://irll.github.io/HierarchyCraft/hcraft/examples.html).
author = {Maxime Chevalier{-}Boisvert and Bolun Dai and Mark Towers and Rodrigo Perez{-}Vicente and Lucas Willems and Salem Lahlou and Suman Pal and Pablo Samuel Castro and Jordan Terry},
40
+
title = {Minigrid {\&} Miniworld: Modular {\&} Customizable Reinforcement Learning Environments for Goal-Oriented Tasks},
41
+
booktitle = {Advances in Neural Information Processing Systems 36, New Orleans, LA, USA},
abstract = {In this report, we summarize the takeaways from the first NeurIPS 2021 NetHack Challenge. Participants were tasked with developing a program or agent that can win (i.e., ’ascend’ in) the popular dungeon-crawler game of NetHack by interacting with the NetHack Learning Environment (NLE), a scalable, procedurally generated, and challenging Gym environment for reinforcement learning (RL). The challenge showcased community-driven progress in AI with many diverse approaches significantly beating the previously best results on NetHack. Furthermore, it served as a direct comparison between neural (e.g., deep RL) and symbolic AI, as well as hybrid systems, demonstrating that on NetHack symbolic bots currently outperform deep RL by a large margin. Lastly, no agent got close to winning the game, illustrating NetHack’s suitability as a long-term benchmark for AI research.}
234
237
}
238
+
239
+
@article{botvinick2014model,
240
+
title={Model-based hierarchical reinforcement learning and human action control},
241
+
author={Botvinick, Matthew and Weinstein, Aaron},
242
+
journal={Philosophical Transactions of the Royal Society B: Biological Sciences},
243
+
volume={369},
244
+
number={1655},
245
+
pages={20130480},
246
+
year={2014},
247
+
publisher={The Royal Society}
248
+
}
249
+
250
+
@inproceedings{bacon2017option,
251
+
title={The option-critic architecture},
252
+
author={Bacon, Pierre-Luc and Harb, Mohamad and Precup, Doina},
253
+
booktitle={Proceedings of the AAAI Conference on Artificial Intelligence},
254
+
volume={31},
255
+
number={1},
256
+
year={2017}
257
+
}
258
+
259
+
@inproceedings{heess2016learning,
260
+
title={Learning continuous control policies by stochastic value gradients},
261
+
author={Heess, Nicolas and Wayne, Greg and Silver, David and Lillicrap, Timothy and Erez, Tom and Tassa, Yuval},
262
+
booktitle={Advances in Neural Information Processing Systems (NeurIPS)},
0 commit comments