% arXiv preprint "Safe RLHF" (Dai et al., 2023); record exported from dblp via BibSonomy.
% Standard fields (author, title, journal, volume, year, doi, eprint, url) come first.
% The fields after them (ee, biburl, interhash, intrahash, keywords, added-at, timestamp)
% are export bookkeeping; bibliography styles do not define them, so they are not printed.
% They are kept so the record can still be matched against its dblp/BibSonomy source.
% The doi and eprint values are derived from the resolver link already stored in ee.
@article{journals/corr/abs-2310-12773,
  author        = {Dai, Josef and Pan, Xuehai and Sun, Ruiyang and Ji, Jiaming and Xu, Xinbo and Liu, Mickel and Wang, Yizhou and Yang, Yaodong},
  title         = {Safe {RLHF}: Safe Reinforcement Learning from Human Feedback},
  journal       = {CoRR},
  volume        = {abs/2310.12773},
  year          = {2023},
  doi           = {10.48550/arXiv.2310.12773},
  eprint        = {2310.12773},
  archiveprefix = {arXiv},
  url           = {http://dblp.uni-trier.de/db/journals/corr/corr2310.html#abs-2310-12773},
  ee            = {https://doi.org/10.48550/arXiv.2310.12773},
  biburl        = {https://www.bibsonomy.org/bibtex/2027db06d6055ab5c7115885fded30e1f/dblp},
  interhash     = {2cdf794a45f37789ac9843f59aef2bba},
  intrahash     = {027db06d6055ab5c7115885fded30e1f},
  keywords      = {dblp},
  added-at      = {2024-05-07T00:00:00.000+0200},
  timestamp     = {2024-05-13T07:38:08.000+0200},
}