% world-model-papers.bib
% BibTeX entries for papers on world models.
% Conference paper (NeurIPS proceedings, volume 31), so it is typed as
% inproceedings. The note keeps the separate worldmodels.github.io link,
% which differs from the proceedings URL in the url field.
@inproceedings{ha2018worldmodels,
  author    = {Ha, David and Schmidhuber, J{\"u}rgen},
  title     = {Recurrent World Models Facilitate Policy Evolution},
  booktitle = {Advances in Neural Information Processing Systems 31},
  pages     = {2451--2463},
  publisher = {Curran Associates, Inc.},
  year      = {2018},
  url       = {https://papers.nips.cc/paper/7512-recurrent-world-models-facilitate-policy-evolution},
  note      = {\url{https://worldmodels.github.io}},
}
% arXiv preprint. Typed as misc because no journal is recorded; the arXiv
% identifier is split into eprint + archivePrefix like the other arXiv
% entries in this file. The project page is stored once, in the url field.
@misc{learningtopredict2019,
  author        = {Freeman, C. Daniel and Metz, Luke and Ha, David},
  title         = {Learning to Predict Without Looking Ahead: World Models Without Forward Prediction},
  year          = {2019},
  eprint        = {1910.13038},
  archivePrefix = {arXiv},
  url           = {https://learningtopredict.github.io},
}
% arXiv preprint 1911.12247, primary class stat.ML.
@misc{kipf2020contrastive,
  author        = {Thomas Kipf and Elise van der Pol and Max Welling},
  title         = {Contrastive Learning of Structured World Models},
  year          = {2020},
  eprint        = {1911.12247},
  archivePrefix = {arXiv},
  primaryClass  = {stat.ML},
}
% arXiv preprint 2011.12491, primary class cs.AI.
@misc{zhang2021world,
  author        = {Lunjun Zhang and Ge Yang and Bradly C. Stadie},
  title         = {World Model as a Graph: Learning Latent Landmarks for Planning},
  year          = {2021},
  eprint        = {2011.12491},
  archivePrefix = {arXiv},
  primaryClass  = {cs.AI},
}
% Conference paper; the url field points at its OpenReview forum page.
% The booktitle carries no trailing whitespace, so styles cannot emit a
% stray space before the following punctuation.
@inproceedings{micheli2023transformers,
  author    = {Vincent Micheli and Eloi Alonso and Fran{\c{c}}ois Fleuret},
  title     = {Transformers are Sample-Efficient World Models},
  booktitle = {The Eleventh International Conference on Learning Representations},
  year      = {2023},
  url       = {https://openreview.net/forum?id=vhFu1Acb0xb},
}
% arXiv preprint 1912.01603, primary class cs.LG.
@misc{hafner2020dream,
  author        = {Danijar Hafner and Timothy Lillicrap and Jimmy Ba and Mohammad Norouzi},
  title         = {Dream to Control: Learning Behaviors by Latent Imagination},
  year          = {2020},
  eprint        = {1912.01603},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}
% arXiv preprint 2010.02193, primary class cs.LG.
% "Atari" is brace-protected so sentence-casing styles keep its capital.
@misc{hafner2022mastering,
  author        = {Danijar Hafner and Timothy Lillicrap and Mohammad Norouzi and Jimmy Ba},
  title         = {Mastering {Atari} with Discrete World Models},
  year          = {2022},
  eprint        = {2010.02193},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}
% arXiv preprint 2202.09481, primary class cs.LG.
% "TransDreamer" is brace-protected so its internal capital survives
% styles that convert titles to sentence case.
@misc{chen2022transdreamer,
  author        = {Chang Chen and Yi-Fu Wu and Jaesik Yoon and Sungjin Ahn},
  title         = {{TransDreamer}: Reinforcement Learning with Transformer World Models},
  year          = {2022},
  eprint        = {2202.09481},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}
% arXiv preprint 2301.04104, primary class cs.AI.
@misc{hafner2023mastering,
  author        = {Danijar Hafner and Jurgis Pasukonis and Jimmy Ba and Timothy Lillicrap},
  title         = {Mastering Diverse Domains through World Models},
  year          = {2023},
  eprint        = {2301.04104},
  archivePrefix = {arXiv},
  primaryClass  = {cs.AI},
}
% arXiv preprint 2002.09604, primary class cs.CL.
@misc{cowenrivers2020emergent,
  author        = {Alexander I. Cowen-Rivers and Jason Naradowsky},
  title         = {Emergent Communication with World Models},
  year          = {2020},
  eprint        = {2002.09604},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
}
% arXiv preprint 2301.12050, primary class cs.LG.
@misc{nottingham2023embodied,
  author        = {Kolby Nottingham and Prithviraj Ammanabrolu and Alane Suhr and Yejin Choi and Hannaneh Hajishirzi and Sameer Singh and Roy Fox},
  title         = {Do Embodied Agents Dream of Pixelated Sheep: Embodied Decision Making using Language Guided World Modelling},
  year          = {2023},
  eprint        = {2301.12050},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}
% arXiv preprint 2305.14992, primary class cs.CL.
@misc{hao2023reasoning,
  author        = {Shibo Hao and Yi Gu and Haodi Ma and Joshua Jiahua Hong and Zhen Wang and Daisy Zhe Wang and Zhiting Hu},
  title         = {Reasoning with Language Model is Planning with World Model},
  year          = {2023},
  eprint        = {2305.14992},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
}
% arXiv preprint 2305.16291, primary class cs.AI.
@misc{wang2023voyager,
  author        = {Guanzhi Wang and Yuqi Xie and Yunfan Jiang and Ajay Mandlekar and Chaowei Xiao and Yuke Zhu and Linxi Fan and Anima Anandkumar},
  title         = {Voyager: An Open-Ended Embodied Agent with Large Language Models},
  year          = {2023},
  eprint        = {2305.16291},
  archivePrefix = {arXiv},
  primaryClass  = {cs.AI},
}
% arXiv preprint 2210.12719, primary class cs.LG.
% The umlaut in "Rocktaschel" is written as a LaTeX escape, matching the
% other accented names in this file and staying safe for 8-bit BibTeX.
@misc{xu2022learning,
  author        = {Yingchen Xu and Jack Parker-Holder and Aldo Pacchiano and Philip J. Ball and Oleh Rybkin and Stephen J. Roberts and Tim Rockt{\"a}schel and Edward Grefenstette},
  title         = {Learning General World Models in a Handful of Reward-Free Deployments},
  year          = {2022},
  eprint        = {2210.12719},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}
% arXiv preprint 2105.08756, primary class cs.CV.
@misc{koh2021pathdreamer,
  author        = {Jing Yu Koh and Honglak Lee and Yinfei Yang and Jason Baldridge and Peter Anderson},
  title         = {Pathdreamer: A World Model for Indoor Navigation},
  year          = {2021},
  eprint        = {2105.08756},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CV},
}
% arXiv preprint 2206.14244, primary class cs.RO.
@misc{seo2023masked,
  author        = {Younggyo Seo and Danijar Hafner and Hao Liu and Fangchen Liu and Stephen James and Kimin Lee and Pieter Abbeel},
  title         = {Masked World Models for Visual Control},
  year          = {2023},
  eprint        = {2206.14244},
  archivePrefix = {arXiv},
  primaryClass  = {cs.RO},
}
% arXiv preprint 2311.17593, primary class cs.LG.
% The acronym "LanGWM" is brace-protected so sentence-casing styles do not
% flatten its mixed capitalisation.
@misc{poudel2023langwm,
  author        = {Rudra P. K. Poudel and Harit Pandya and Chao Zhang and Roberto Cipolla},
  title         = {{LanGWM}: Language Grounded World Model},
  year          = {2023},
  eprint        = {2311.17593},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}
% arXiv preprint 2308.01399, primary class cs.CL.
@misc{lin2023learning,
  author        = {Jessy Lin and Yuqing Du and Olivia Watkins and Danijar Hafner and Pieter Abbeel and Dan Klein and Anca Dragan},
  title         = {Learning to Model the World with Language},
  year          = {2023},
  eprint        = {2308.01399},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
}
% arXiv preprint 2307.02064, primary class cs.LG.
% "RNNs" and "S4" are brace-protected; without the braces a sentence-casing
% style would print them as "rnns" and "s4".
@misc{deng2023facing,
  author        = {Fei Deng and Junyeong Park and Sungjin Ahn},
  title         = {Facing Off World Model Backbones: {RNNs}, Transformers, and {S4}},
  year          = {2023},
  eprint        = {2307.02064},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
}
% arXiv preprint 2402.01695, primary class cs.CL.
% The acronym "AI" is brace-protected so sentence-casing styles keep it
% upper-case.
@misc{zhang2024languageguided,
  author        = {Alex Zhang and Khanh Nguyen and Jens Tuyls and Albert Lin and Karthik Narasimhan},
  title         = {Language-Guided World Models: A Model-Based Approach to {AI} Control},
  year          = {2024},
  eprint        = {2402.01695},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
}