Open problems and fundamental limitations of reinforcement learning from human feedback
Fields with differences: venue. Compare local vs external BibTeX below.
Authors
Venue
Transactions on Machine Learning Research (TMLR)
Links
BibTeX
Local Entry
% Local record: the journal version of the paper. The author list is
% abbreviated to its first ten names; "and others" marks the truncation so
% styles render it as "et al." instead of presenting the list as complete.
@article{casper2023,
  author  = {Casper, Stephen and Davies, Xander and Shi, Claudia and
             Gilbert, Thomas Krendl and Scheurer, J{\'e}r{\'e}my and
             Rando, Javier and Freedman, Rachel and Korbak, Tomasz and
             Lindner, David and Freire, Pedro and others},
  title   = {Open problems and fundamental limitations of reinforcement learning from human feedback},
  journal = {Transactions on Machine Learning Research (TMLR)},
  year    = {2023},
  url     = {https://openreview.net/forum?id=bx24KpJ4Eb},
}
From AUTO:OPENALEX
% External record: the arXiv preprint of the paper. The arXiv identifier is
% carried in the eprint fields instead of being disguised as a journal name.
% NOTE(review): this record uses the same citation key as the local entry
% above; keep only one of the two in any .bib file that is actually compiled.
@misc{casper2023,
  author        = {Casper, Stephen and Davies, Xander and Shi, Claudia and
                   Gilbert, Thomas Krendl and Scheurer, J{\'e}r{\'e}my and
                   Rando, Javier and Freedman, Rachel and Korbak, Tomasz and
                   Lindner, David and Freire, Pedro J. and Wang, Tony and
                   Marks, Samuel D. and S{\'e}gerie, Charbel-Rapha{\"e}l and
                   Carroll, Micah and Peng, Andi and
                   Christoffersen, Phillip and Damani, Mehul and
                   Slocum, Stewart and Usman, Anwar and
                   Siththaranjan, Anand and Nadeau, Max and
                   Michaud, Eric J. and Pfau, Jacob and
                   Krasheninnikov, Dmitrii and Chen, Xin and
                   Langosco, Lauro and Hase, Peter and
                   B{\i}y{\i}k, Erdem and Dragan, Anca D. and
                   Krueger, David and Sadigh, Dorsa and
                   Hadfield-Menell, Dylan},
  title         = {Open Problems and Fundamental Limitations of Reinforcement Learning from Human Feedback},
  year          = {2023},
  eprint        = {2307.15217},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.2307.15217},
}