Deep reinforcement learning from human preferences
Authors
Venue
Advances in neural information processing systems
BibTeX
Local Entry
% Locally curated record for the proceedings version of the paper.
% Names use the unambiguous "Last, First" form; the title and booktitle are
% stored in Title Case so styles may downcase them but never lose capitals.
@inproceedings{christiano2017,
  author    = {Christiano, Paul F. and Leike, Jan and Brown, Tom B. and Martic, Miljan and Legg, Shane and Amodei, Dario},
  title     = {Deep Reinforcement Learning from Human Preferences},
  booktitle = {Advances in Neural Information Processing Systems},
  year      = {2017},
}
From AUTO:OPENALEX
% OpenAlex-sourced record for the arXiv preprint of the same paper.
% It gets its own key because christiano2017 is already taken by the
% proceedings entry earlier in this file (a repeated key is a BibTeX error).
% OpenAlex's repository label "arXiv (Cornell University)" is not a
% proceedings title, so the preprint is identified via the eprint fields
% (identifier taken from the DOI suffix) instead of booktitle.
@misc{christiano2017arxiv,
  author        = {Christiano, Paul F. and Leike, Jan and Brown, Tom B. and Martic, Miljan and Legg, Shane and Amodei, Dario},
  title         = {Deep Reinforcement Learning from Human Preferences},
  year          = {2017},
  eprint        = {1706.03741},
  archiveprefix = {arXiv},
  doi           = {10.48550/arxiv.1706.03741},
}