% Preprint entry. @article requires `journal` (it does not use `booktitle`), so the
% venue text lives in `journal`. The fields after `year` are non-standard and are
% ignored by standard BibTeX styles; presumably read by a site template -- confirm.
@article{wang2025unleashing,
  title               = {Unleashing the Reasoning Potential of Pre-trained {LLMs} by Critique Fine-Tuning on One Problem},
  author              = {Wang, Yubo and Nie, Ping and Zou, Kai and Wu, Lijun and Chen, Wenhu},
  journal             = {arXiv preprint},
  month               = jun,
  year                = {2025},
  github              = {TIGER-AI-Lab/One-Shot-CFT},
  huggingface         = {https://huggingface.co/collections/TIGER-Lab/one-shot-cft-683fbb4d2bcf698dbea8fb21},
  twitter             = {https://x.com/YuboWang726/status/1930454445613088986},
  selected            = {true},
  num_co_first_author = {1},
}
COLM 2025
ScholarCopilot: Training Large Language Models for Academic Writing with Accurate Citations
Yubo Wang, Xueguang Ma, Ping Nie, and 7 more authors
% Conference paper, so the entry type is @inproceedings (the type that uses `booktitle`).
% The fields after `year` are non-standard and are ignored by standard BibTeX styles;
% presumably read by a site template -- confirm.
@inproceedings{wang2025scholarcopilot,
  title               = {{ScholarCopilot}: Training Large Language Models for Academic Writing with Accurate Citations},
  author              = {Wang, Yubo and Ma, Xueguang and Nie, Ping and Zeng, Huaye and Lyu, Zhiheng and Zhang, Yuxuan and Schneider, Benjamin and Lu, Yi and Yue, Xiang and Chen, Wenhu},
  booktitle           = {2nd Conference on Language Modeling},
  month               = apr,
  year                = {2025},
  github              = {TIGER-AI-Lab/ScholarCopilot},
  huggingface         = {https://huggingface.co/collections/TIGER-Lab/scholarcopilot-6756f940df88114b24232074},
  twitter             = {https://x.com/WenhuChen/status/1907861046833885397},
  selected            = {true},
  num_co_first_author = {1},
}
COLM 2025
Critique Fine-Tuning: Learning to Critique is More Effective than Learning to Imitate
% Conference paper, so the entry type is @inproceedings (the type that uses `booktitle`).
% The fields after `year` are non-standard and are ignored by standard BibTeX styles;
% presumably read by a site template -- confirm.
@inproceedings{wang2025critique,
  title               = {Critique Fine-Tuning: Learning to Critique is More Effective than Learning to Imitate},
  author              = {Wang, Yubo and Yue, Xiang and Chen, Wenhu},
  booktitle           = {2nd Conference on Language Modeling},
  month               = jan,
  year                = {2025},
  github              = {TIGER-AI-Lab/CritiqueFineTuning},
  huggingface         = {https://huggingface.co/collections/TIGER-Lab/critiquefinetuning-679b25e1528e75180f55e5c4},
  twitter             = {https://x.com/WenhuChen/status/1885060597500567562},
  selected            = {true},
  num_co_first_author = {1},
}
2024
NeurIPS 2024
MMLU-Pro: A More Robust and Challenging Multi-task Language Understanding Benchmark
Yubo Wang, Xueguang Ma, Ge Zhang, and 8 more authors
% Conference paper, so the entry type is @inproceedings (the type that uses `booktitle`).
% The author list ends with the literal `and others`, which styles render as "et al.".
% The fields after `year` are non-standard and are ignored by standard BibTeX styles;
% presumably read by a site template -- confirm.
@inproceedings{wang2024mmlu,
  title               = {{MMLU-Pro}: A More Robust and Challenging Multi-task Language Understanding Benchmark},
  author              = {Wang, Yubo and Ma, Xueguang and Zhang, Ge and Ni, Yuansheng and Chandra, Abhranil and Guo, Shiguang and Ren, Weiming and Arulraj, Aaran and He, Xuan and Jiang, Ziyan and others},
  booktitle           = {Proceedings of NeurIPS 2024},
  month               = jun,
  year                = {2024},
  github              = {TIGER-AI-Lab/MMLU-Pro},
  huggingface         = {https://huggingface.co/spaces/TIGER-Lab/MMLU-Pro},
  twitter             = {https://x.com/YuboWang726/status/1839330905145610688},
  selected            = {true},
  num_co_first_author = {1},
}