% Conference paper (NeurIPS 2025): self-play fine-tuning for LLMs using triplets instead of pairs.
@inproceedings{NeurIPS:2025:Wang:A,
  author    = {Wang, Yibo and Sun, Hai-Long and Huzhang, Guangda and Chen, Qing-Guo and Xu, Zhao and Luo, Weihua and Zhang, Kaifu and Zhang, Lijun},
  title     = {Triplets Better Than Pairs: Towards Stable and Effective Self-Play Fine-Tuning for {LLMs}},
  booktitle = {Advances in Neural Information Processing Systems 38 ({NeurIPS})},
  pages     = {40980--41009},
  year      = {2025},
}