% Conference paper (venue taken from booktitle); the arXiv identifier is kept in the eprint fields.
@InProceedings{Xu2024IsDS,
  author        = {Xu, Shusheng and Fu, Wei and Gao, Jiaxuan and Ye, Wenjie and Liu, Weiling and Mei, Zhiyu and Wang, Guangju and Yu, Chao and Wu, Yi},
  title         = {Is {DPO} Superior to {PPO} for {LLM} Alignment? {A} Comprehensive Study},
  booktitle     = {International Conference on Machine Learning},
  year          = {2024},
  eprint        = {2404.10719},
  archiveprefix = {arXiv},
}