% arXiv preprint 2310.13595 [cs.CY]; author names are stored in "Last, First" form.
@misc{lambert2023entangled,
  author        = {Lambert, Nathan and Gilbert, Thomas Krendl and Zick, Tom},
  title         = {Entangled Preferences: The History and Risks of Reinforcement Learning and Human Feedback},
  year          = 2023,
  eprint        = {2310.13595},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CY},
}