Data Leverage References

← Back to browse

Training language models to follow instructions with human feedback

2022 article ouyang2022instructgpt Not yet verified
Authors
Long Ouyang, Jeff Wu, Xu Jiang, Diogo Almeida, Carroll L. Wainwright, Pamela Mishkin, Chong Zhang, Sandhini Agarwal, Katarina Slama, Alex Ray, John Schulman, Jacob Hilton, Fraser Kelton, Luke Miller, Maddie Simens, Amanda Askell, Peter Welinder, Paul Christiano, Jan Leike, Ryan Lowe
Venue
arXiv preprint arXiv:2203.02155

BibTeX

Local Entry
@comment{ouyang2022instructgpt is an arXiv preprint: the arXiv identifier is stored in eprint/archiveprefix instead of being embedded in a journal field, and the entry type is misc because the record names no journal.}
@misc{ouyang2022instructgpt,
  author        = {Ouyang, Long and Wu, Jeff and Jiang, Xu and Almeida, Diogo and Wainwright, Carroll L. and Mishkin, Pamela and Zhang, Chong and Agarwal, Sandhini and Slama, Katarina and Ray, Alex and Schulman, John and Hilton, Jacob and Kelton, Fraser and Miller, Luke and Simens, Maddie and Askell, Amanda and Welinder, Peter and Christiano, Paul and Leike, Jan and Lowe, Ryan},
  title         = {Training language models to follow instructions with human feedback},
  year          = {2022},
  eprint        = {2203.02155},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.2203.02155},
  url           = {https://arxiv.org/abs/2203.02155},
}
From OPENALEX
@article{ouyang2022instructgpt,
  author  = {Long Ouyang and Jeff Wu and Xu Jiang and Diogo Almeida and Carroll L. Wainwright and Pamela Mishkin and Chong Zhang and Sandhini Agarwal and Katarina Slama and Alex Ray and John Schulman and Jacob Hilton and Fraser Kelton and Luke E. Miller and Maddie Simens and Amanda Askell and Peter Welinder and Paul Christiano and Jan Leike and Ryan Lowe},
  title   = {Training language models to follow instructions with human feedback},
  journal = {arXiv (Cornell University)},
  year    = {2022},
  doi     = {10.48550/arxiv.2203.02155},
}