% Journal article published in Transactions on Machine Learning Research (2025).
% Author names use the unambiguous "Last, First" form and keep the same
% given/family split that BibTeX inferred from the original "First Last" input.
% NOTE(review): "Qi, Zhao" follows the exported name order -- confirm the
% family name against the published paper.
@article{kong2025qpo,
  author  = {Kong, Yilun and Mao, Hangyu and Qi, Zhao and Zhang, Bin and Ruan, Jingqing and Shen, Li and Chang, Yongzhe and Wang, Xueqian and Zhao, Rui and Tao, Dacheng},
  title   = {{QPO}: Query-dependent Prompt Optimization via Multi-Loop Offline Reinforcement Learning},
  journal = {Transactions on Machine Learning Research},
  year    = {2025},
  issn    = {2835-8856},
  url     = {https://openreview.net/forum?id=bqMJToTkvT},
}