SRPO: Self-Referential Policy Optimization for Vision-Language-Action Models
BibTeX
Copy
@comment{arXiv preprint 2511.15605. The exported citation key and year field
contained a raw timestamp string (Wed Nov 19 2025 ...); both are normalised
here to the plain four-digit year 2025.}
@misc{fei2025srposelfreferentialpolicy,
  title         = {{SRPO}: Self-Referential Policy Optimization for Vision-Language-Action Models},
  author        = {Senyu Fei and Siyin Wang and Li Ji and Ao Li and Shiduo Zhang and Liming Liu and Jinlong Hou and Jingjing Gong and Xianzhong Zhao and Xipeng Qiu},
  year          = {2025},
  eprint        = {2511.15605},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2511.15605},
}