% arXiv preprint 2411.16345 (primary class cs.CL).
@misc{Jiao-po,
  author        = {Fangkai Jiao and Geyang Guo and Xingxing Zhang and Nancy F. Chen and Shafiq Joty and Furu Wei},
  title         = {Preference Optimization for Reasoning with Pseudo Feedback},
  year          = {2024},
  eprint        = {2411.16345},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
  url           = {https://arxiv.org/abs/2411.16345},
}