@comment{
  dblp record (re-exported via BibSonomy) for arXiv preprint 2403.10704.
  The citation key and the dblp/BibSonomy bookkeeping fields (added-at,
  biburl, ee, interhash, intrahash, keywords, timestamp) are kept as
  exported; standard styles ignore the fields they do not know.
  doi and eprint/eprinttype carry the identifiers in the form styles read;
  journal/volume keep the dblp CoRR convention so classic styles still
  print a venue.
}
@article{journals/corr/abs-2403-10704,
  added-at   = {2024-04-08T00:00:00.000+0200},
  author     = {Sidahmed, Hakim and Phatale, Samrat and Hutcheson, Alex and Lin, Zhuonan and Chen, Zhang and Yu, Zac and Jin, Jarvis and Komarytsia, Roman and Ahlheim, Christiane and Zhu, Yonghao and Chaudhary, Simral and Li, Bowen and Ganesh, Saravanan and Byrne, Bill and Hoffmann, Jessica and Mansoor, Hassan and Li, Wei and Rastogi, Abhinav and Dixon, Lucas},
  biburl     = {https://www.bibsonomy.org/bibtex/2d5cc78a30f7062225cbd45a2440355bd/dblp},
  doi        = {10.48550/arXiv.2403.10704},
  ee         = {https://doi.org/10.48550/arXiv.2403.10704},
  eprint     = {2403.10704},
  eprinttype = {arXiv},
  interhash  = {f8cf1c9bce047c83de2dbb2e7e323efc},
  intrahash  = {d5cc78a30f7062225cbd45a2440355bd},
  journal    = {CoRR},
  keywords   = {dblp},
  timestamp  = {2024-04-12T14:38:23.000+0200},
  title      = {{PERL}: Parameter Efficient Reinforcement Learning from Human Feedback},
  url        = {http://dblp.uni-trier.de/db/journals/corr/corr2403.html#abs-2403-10704},
  volume     = {abs/2403.10704},
  year       = {2024},
}