RLPR: Extrapolating RLVR to General Domains without Verifiers
BibTeX
Copy
% arXiv preprint entry. Acronyms in the title are brace-protected so that
% sentence-casing bibliography styles keep them in uppercase; author names use
% the unambiguous "Last, First" form.
% NOTE(review): author order is not verifiable from this file; confirm it
% against the arXiv record before publishing.
@misc{liu2025rlprextrapolatingrlvr,
  title         = {{RLPR}: Extrapolating {RLVR} to General Domains without Verifiers},
  author        = {Liu, Zhiyuan and Sun, Maosong and Cui, Ganqu and Yao, Yuan and Ding, Ning and Chua, Tat-Seng and Yuan, Lifan and Yu, Tianyu and Ji, Bo and Wang, Zefan and Wang, Shouli and Yao, Shu},
  year          = {2025},
  eprint        = {2506.18254},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://arxiv.org/abs/2506.18254},
}