% Fisch et al. (2025), journal article in Transactions on Machine Learning Research;
% the url field points to the paper's OpenReview forum page.
@article{fisch2025robust,
  author  = {Fisch, Adam and Eisenstein, Jacob and Zayats, Vicky and Agarwal, Alekh and Beirami, Ahmad and Nagpal, Chirag and Shaw, Peter and Berant, Jonathan},
  title   = {Robust Preference Optimization through Reward Model Distillation},
  journal = {Transactions on Machine Learning Research},
  year    = {2025},
  issn    = {2835-8856},
  url     = {https://openreview.net/forum?id=E2zKNuwNDc},
}