world-model-papers.bib

% Ha and Schmidhuber (2018), paper in Advances in Neural Information
% Processing Systems 31. Typed as a proceedings paper; the note carries the
% companion project page, which is distinct from the proceedings url.
@inproceedings{ha2018worldmodels,
  author    = {Ha, David and Schmidhuber, J{\"u}rgen},
  title     = {Recurrent World Models Facilitate Policy Evolution},
  booktitle = {Advances in Neural Information Processing Systems 31},
  pages     = {2451--2463},
  year      = {2018},
  publisher = {Curran Associates, Inc.},
  url       = {https://papers.nips.cc/paper/7512-recurrent-world-models-facilitate-policy-evolution},
  note      = {\url{https://worldmodels.github.io}},
}

% Freeman, Metz and Ha (2019), arXiv preprint 1910.13038.
% Stored as a misc entry like the other arXiv preprints in this file, because
% no journal is given. The eprint field holds the bare identifier and the
% archive name lives in archivePrefix. The project page is kept once, in url.
@misc{learningtopredict2019,
  author        = {Freeman, C. Daniel and Metz, Luke and Ha, David},
  title         = {Learning to Predict Without Looking Ahead: World Models Without Forward Prediction},
  year          = {2019},
  eprint        = {1910.13038},
  archivePrefix = {arXiv},
  url           = {https://learningtopredict.github.io},
}

% Kipf, van der Pol and Welling (2020), arXiv preprint 1911.12247, class stat.ML.
@misc{kipf2020contrastive,
  author        = {Thomas Kipf and Elise van der Pol and Max Welling},
  title         = {Contrastive Learning of Structured World Models},
  year          = {2020},
  eprint        = {1911.12247},
  archivePrefix = {arXiv},
  primaryClass  = {stat.ML},
}

% Zhang, Yang and Stadie (2021), arXiv preprint 2011.12491, class cs.AI.
@misc{zhang2021world,
  author        = {Lunjun Zhang and Ge Yang and Bradly C. Stadie},
  title         = {World Model as a Graph: Learning Latent Landmarks for Planning},
  year          = {2021},
  eprint        = {2011.12491},
  archivePrefix = {arXiv},
  primaryClass  = {cs.AI},
}

% Micheli, Alonso and Fleuret (2023), paper at the Eleventh International
% Conference on Learning Representations; url is the OpenReview forum page.
@inproceedings{micheli2023transformers,
  author    = {Vincent Micheli and Eloi Alonso and Fran{\c{c}}ois Fleuret},
  title     = {Transformers are Sample-Efficient World Models},
  booktitle = {The Eleventh International Conference on Learning Representations},
  year      = {2023},
  url       = {https://openreview.net/forum?id=vhFu1Acb0xb},
}

% Hafner, Lillicrap, Ba and Norouzi (2020), arXiv preprint 1912.01603, class cs.LG.
@misc{hafner2020dream,
  author        = {Danijar Hafner and Timothy Lillicrap and Jimmy Ba and Mohammad Norouzi},
  title         = {Dream to Control: Learning Behaviors by Latent Imagination},
  year          = {2020},
  eprint        = {1912.01603},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}

% Hafner, Lillicrap, Norouzi and Ba (2022), arXiv preprint 2010.02193, class cs.LG.
% The proper noun in the title is brace-protected so sentence-casing
% bibliography styles do not lowercase it.
@misc{hafner2022mastering,
  author        = {Danijar Hafner and Timothy Lillicrap and Mohammad Norouzi and Jimmy Ba},
  title         = {Mastering {Atari} with Discrete World Models},
  year          = {2022},
  eprint        = {2010.02193},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}

% Chen, Wu, Yoon and Ahn (2022), arXiv preprint 2202.09481, class cs.LG.
% The camel-case method name is brace-protected so sentence-casing styles
% keep its interior capital.
@misc{chen2022transdreamer,
  author        = {Chang Chen and Yi-Fu Wu and Jaesik Yoon and Sungjin Ahn},
  title         = {{TransDreamer}: Reinforcement Learning with Transformer World Models},
  year          = {2022},
  eprint        = {2202.09481},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}

% Hafner, Pasukonis, Ba and Lillicrap (2023), arXiv preprint 2301.04104, class cs.AI.
@misc{hafner2023mastering,
  author        = {Danijar Hafner and Jurgis Pasukonis and Jimmy Ba and Timothy Lillicrap},
  title         = {Mastering Diverse Domains through World Models},
  year          = {2023},
  eprint        = {2301.04104},
  archivePrefix = {arXiv},
  primaryClass  = {cs.AI},
}

% Cowen-Rivers and Naradowsky (2020), arXiv preprint 2002.09604, class cs.CL.
@misc{cowenrivers2020emergent,
  author        = {Alexander I. Cowen-Rivers and Jason Naradowsky},
  title         = {Emergent Communication with World Models},
  year          = {2020},
  eprint        = {2002.09604},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
}

% Nottingham and six co-authors (2023), arXiv preprint 2301.12050, class cs.LG.
@misc{nottingham2023embodied,
  author        = {Kolby Nottingham and Prithviraj Ammanabrolu and Alane Suhr and Yejin Choi and Hannaneh Hajishirzi and Sameer Singh and Roy Fox},
  title         = {Do Embodied Agents Dream of Pixelated Sheep: Embodied Decision Making using Language Guided World Modelling},
  year          = {2023},
  eprint        = {2301.12050},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}

% Hao and six co-authors (2023), arXiv preprint 2305.14992, class cs.CL.
@misc{hao2023reasoning,
  author        = {Shibo Hao and Yi Gu and Haodi Ma and Joshua Jiahua Hong and Zhen Wang and Daisy Zhe Wang and Zhiting Hu},
  title         = {Reasoning with Language Model is Planning with World Model},
  year          = {2023},
  eprint        = {2305.14992},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
}

% Wang and seven co-authors (2023), arXiv preprint 2305.16291, class cs.AI.
@misc{wang2023voyager,
  author        = {Guanzhi Wang and Yuqi Xie and Yunfan Jiang and Ajay Mandlekar and Chaowei Xiao and Yuke Zhu and Linxi Fan and Anima Anandkumar},
  title         = {Voyager: An Open-Ended Embodied Agent with Large Language Models},
  year          = {2023},
  eprint        = {2305.16291},
  archivePrefix = {arXiv},
  primaryClass  = {cs.AI},
}

% Xu and seven co-authors (2022), arXiv preprint 2210.12719, class cs.LG.
% The umlaut in the seventh author's surname is written as a LaTeX escape,
% matching the escape convention used by other entries in this file.
@misc{xu2022learning,
  author        = {Yingchen Xu and Jack Parker-Holder and Aldo Pacchiano and Philip J. Ball and Oleh Rybkin and Stephen J. Roberts and Tim Rockt{\"a}schel and Edward Grefenstette},
  title         = {Learning General World Models in a Handful of Reward-Free Deployments},
  year          = {2022},
  eprint        = {2210.12719},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}

% Koh, Lee, Yang, Baldridge and Anderson (2021), arXiv preprint 2105.08756, class cs.CV.
@misc{koh2021pathdreamer,
  author        = {Jing Yu Koh and Honglak Lee and Yinfei Yang and Jason Baldridge and Peter Anderson},
  title         = {Pathdreamer: A World Model for Indoor Navigation},
  year          = {2021},
  eprint        = {2105.08756},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CV},
}

% Seo and six co-authors (2023), arXiv preprint 2206.14244, class cs.RO.
@misc{seo2023masked,
  author        = {Younggyo Seo and Danijar Hafner and Hao Liu and Fangchen Liu and Stephen James and Kimin Lee and Pieter Abbeel},
  title         = {Masked World Models for Visual Control},
  year          = {2023},
  eprint        = {2206.14244},
  archivePrefix = {arXiv},
  primaryClass  = {cs.RO},
}

% Poudel, Pandya, Zhang and Cipolla (2023), arXiv preprint 2311.17593, class cs.LG.
% The mixed-case acronym in the title is brace-protected so sentence-casing
% styles do not flatten it.
@misc{poudel2023langwm,
  author        = {Rudra P. K. Poudel and Harit Pandya and Chao Zhang and Roberto Cipolla},
  title         = {{LanGWM}: Language Grounded World Model},
  year          = {2023},
  eprint        = {2311.17593},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}

% Lin and six co-authors (2023), arXiv preprint 2308.01399, class cs.CL.
@misc{lin2023learning,
  author        = {Jessy Lin and Yuqing Du and Olivia Watkins and Danijar Hafner and Pieter Abbeel and Dan Klein and Anca Dragan},
  title         = {Learning to Model the World with Language},
  year          = {2023},
  eprint        = {2308.01399},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
}

% Deng, Park and Ahn (2023), arXiv preprint 2307.02064, class cs.LG.
% The acronym and the model name in the title are brace-protected so
% sentence-casing styles do not lowercase them.
@misc{deng2023facing,
  author        = {Fei Deng and Junyeong Park and Sungjin Ahn},
  title         = {Facing Off World Model Backbones: {RNNs}, Transformers, and {S4}},
  year          = {2023},
  eprint        = {2307.02064},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}

% Zhang, Nguyen, Tuyls, Lin and Narasimhan (2024), arXiv preprint 2402.01695, class cs.CL.
% The acronym in the title is brace-protected so sentence-casing styles do
% not lowercase it.
@misc{zhang2024languageguided,
  author        = {Alex Zhang and Khanh Nguyen and Jens Tuyls and Albert Lin and Karthik Narasimhan},
  title         = {Language-Guided World Models: A Model-Based Approach to {AI} Control},
  year          = {2024},
  eprint        = {2402.01695},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
}