From Data to Rewards: a Bilevel Optimization Perspective on Maximum Likelihood Estimation
BibTeX
Copy
% arXiv preprint 2510.07624 (cs.LG). The citation key and year were normalised
% from an export timestamp ("Wed Oct 08 2025 ...") to the four-digit year 2025.
% NOTE(review): authors are in "First Last" form; confirm the surname split of
% "Youssef Attia El Hili" before converting the list to "Last, First" form.
@misc{benechehab2025datarewardsbilevel,
  title         = {From Data to Rewards: a Bilevel Optimization Perspective on Maximum Likelihood Estimation},
  author        = {Abdelhakim Benechehab and Gabriel Singer and Corentin L{\'e}ger and Youssef Attia El Hili and Giuseppe Paolo and Albert Thomas and Maurizio Filippone and Bal{\'a}zs K{\'e}gl},
  year          = {2025},
  eprint        = {2510.07624},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://arxiv.org/abs/2510.07624},
}