% NeurIPS 2025 conference paper. The original entry had an empty pages field,
% so it is omitted here; add a pages field (e.g. 123--148) once page numbers are known.
% The booktitle carries no leading "In" because bibliography styles insert it.
@inproceedings{NeurIPS:2025:Wang:B,
  author    = {Wang, Yibo and Sun, Hai-Long and Huzhang, Guangda and Chen, Qing-Guo and Xu, Zhao and Luo, Weihua and Zhang, Kaifu and Zhang, Lijun},
  title     = {Triplets Better Than Pairs: Towards Stable and Effective Self-Play Fine-Tuning for {LLMs}},
  booktitle = {Advances in Neural Information Processing Systems 38 ({NeurIPS} 2025)},
  year      = {2025},
}