Training language models to follow instructions with human feedback
Authors
Venue
arXiv preprint arXiv:2203.02155
Tags
Links
BibTeX
Local Entry
% Local record for the arXiv preprint 2203.02155.
% The arXiv identifier is stored in eprint/archiveprefix instead of being
% embedded in a journal field, so styles can format and link it themselves.
% Author names use the unambiguous "Last, First" form.
@misc{ouyang2022instructgpt,
  author        = {Ouyang, Long and Wu, Jeff and Jiang, Xu and Almeida, Diogo and Wainwright, Carroll L. and Mishkin, Pamela and Zhang, Chong and Agarwal, Sandhini and Slama, Katarina and Ray, Alex and Schulman, John and Hilton, Jacob and Kelton, Fraser and Miller, Luke and Simens, Maddie and Askell, Amanda and Welinder, Peter and Christiano, Paul and Leike, Jan and Lowe, Ryan},
  title         = {Training language models to follow instructions with human feedback},
  year          = {2022},
  eprint        = {2203.02155},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2203.02155},
}
From OPENALEX
% Record as imported from OpenAlex for the arXiv preprint 2203.02155.
% The repository host name that OpenAlex reports as the "journal" is dropped;
% the arXiv identifier (taken from the DOI suffix) goes in eprint/archiveprefix.
% NOTE(review): this record reuses the citation key of the local entry earlier
% in this file. A .bib database may define each key only once, so keep just one
% of the two records (or give this one a distinct key) before compiling.
% NOTE(review): the local entry lists "Luke Miller" without the middle initial;
% confirm which form is correct.
@misc{ouyang2022instructgpt,
  author        = {Ouyang, Long and Wu, Jeff and Jiang, Xu and Almeida, Diogo and Wainwright, Carroll L. and Mishkin, Pamela and Zhang, Chong and Agarwal, Sandhini and Slama, Katarina and Ray, Alex and Schulman, John and Hilton, Jacob and Kelton, Fraser and Miller, Luke E. and Simens, Maddie and Askell, Amanda and Welinder, Peter and Christiano, Paul and Leike, Jan and Lowe, Ryan},
  title         = {Training language models to follow instructions with human feedback},
  year          = {2022},
  eprint        = {2203.02155},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.2203.02155},
}