% Jiao et al., "Preference Optimization for Reasoning with Pseudo Feedback" (2025).
% Conference entry; the arXiv identifier in eprint is the one embedded in url.
% NOTE(review): series carries a venue tag ("ICLR-25 (spotlight)") rather than a
% publication series, and address looks like the conference location -- presumably
% both are read by a publication-list template; confirm before moving them to
% note / venue fields.
@inproceedings{Jiao-po,
  author        = {Jiao, Fangkai and Guo, Geyang and Zhang, Xingxing and Chen, Nancy F. and Joty, Shafiq and Wei, Furu},
  title         = {Preference Optimization for Reasoning with Pseudo Feedback},
  booktitle     = {International Conference on Learning Representations},
  series        = {ICLR-25 (spotlight)},
  address       = {Singapore},
  year          = {2025},
  url           = {https://arxiv.org/abs/2411.16345},
  eprint        = {2411.16345},
  archiveprefix = {arXiv},
}