% ICML 2026 paper. The braces around XSkill keep its mixed-case spelling
% under bibliography styles that sentence-case titles.
% github_repo is a non-standard field; standard styles ignore unknown fields.
@inproceedings{jiang2026xskill,
  title       = {{XSkill}: Continual Learning from Experience and Skills in Multimodal Agents},
  author      = {Jiang, Guanyu and Su, Zhaochen and Qu, Xiaoye and Fung, Yi R. (May)},
  booktitle   = {International Conference on Machine Learning (ICML)},
  year        = {2026},
  github_repo = {XSkill-Agent/XSkill},
}
arXiv
AgentVista: Evaluating Multimodal Agents in Ultra-Challenging Realistic Visual Scenarios
Zhaochen Su, Jincheng Gao, Hangyu Guo, Zhenhua Liu, Lueyang Zhang, Xinyu Geng, Shijue Huang, Peng Xia, Guanyu Jiang, Cheng Wang, Yue Zhang, Yi R. (May) Fung, and Junxian He
% arXiv preprint. AgentVista is brace-protected so sentence-casing styles
% do not turn it into "Agentvista". The journal string is kept for styles
% that only print the journal field; eprint/archiveprefix carry the same
% identifier in machine-readable form.
@article{su2026agentvista,
  title         = {{AgentVista}: Evaluating Multimodal Agents in Ultra-Challenging Realistic Visual Scenarios},
  author        = {Su, Zhaochen and Gao, Jincheng and Guo, Hangyu and Liu, Zhenhua and
                   Zhang, Lueyang and Geng, Xinyu and Huang, Shijue and Xia, Peng and
                   Jiang, Guanyu and Wang, Cheng and Zhang, Yue and Fung, Yi R. (May) and
                   He, Junxian},
  journal       = {arXiv preprint arXiv:2602.23166},
  eprint        = {2602.23166},
  archiveprefix = {arXiv},
  year          = {2026},
  github_repo   = {hkust-nlp/AgentVista},
}
ICLR 2026
The Tool Decathlon: Benchmarking Language Agents for Diverse, Realistic, and Long-Horizon Task Execution
Junlong Li, Wenshuo Zhao, Jian Zhao, Weihao Zeng, Haoze Wu, Xiaochen Wang, Rui Ge, Yuxuan Cao, Yuzhen Huang, Wei Liu, Junteng Liu, Zhaochen Su, Yiyang Guo, Fan Zhou, Lueyang Zhang, Juan Michelini, Xingyao Wang, Xiang Yue, Shuyan Zhou, Graham Neubig, and Junxian He
In International Conference on Learning Representations (ICLR), 2026
% ICLR 2026 paper. "Tool Decathlon" is the benchmark's name, so it is
% brace-protected against title sentence-casing.
@inproceedings{li2026toolathlon,
  title       = {The {Tool Decathlon}: Benchmarking Language Agents for Diverse, Realistic, and Long-Horizon Task Execution},
  author      = {Li, Junlong and Zhao, Wenshuo and Zhao, Jian and Zeng, Weihao and
                 Wu, Haoze and Wang, Xiaochen and Ge, Rui and Cao, Yuxuan and
                 Huang, Yuzhen and Liu, Wei and Liu, Junteng and Su, Zhaochen and
                 Guo, Yiyang and Zhou, Fan and Zhang, Lueyang and Michelini, Juan and
                 Wang, Xingyao and Yue, Xiang and Zhou, Shuyan and Neubig, Graham and
                 He, Junxian},
  booktitle   = {International Conference on Learning Representations (ICLR)},
  year        = {2026},
  github_repo = {hkust-nlp/Toolathlon},
}
ICLR 2026
GRACE: Generative Representation Learning via Contrastive Policy Optimization
Jiashuo Sun, Shixuan Liu, Zhaochen Su, Xianrui Zhong, Pengcheng Jiang, Bowen Jin, Peiran Li, Weijia Shi, and Jiawei Han
In International Conference on Learning Representations (ICLR), 2026
% ICLR 2026 paper. The acronym GRACE is brace-protected; without the braces
% sentence-casing styles would print it as "Grace".
@inproceedings{sun2026grace,
  title       = {{GRACE}: Generative Representation Learning via Contrastive Policy Optimization},
  author      = {Sun, Jiashuo and Liu, Shixuan and Su, Zhaochen and Zhong, Xianrui and
                 Jiang, Pengcheng and Jin, Bowen and Li, Peiran and Shi, Weijia and
                 Han, Jiawei},
  booktitle   = {International Conference on Learning Representations (ICLR)},
  year        = {2026},
  github_repo = {GasolSun36/GRACE},
}
ICLR 2026
Advancing Multimodal Reasoning: From Optimized Cold Start to Staged Reinforcement Learning
% ICLR 2026 paper. github_repo is a custom field that standard
% bibliography styles ignore.
@inproceedings{chen2026advancing,
  author      = {Chen, Shuang and Guo, Yue and Su, Zhaochen and Li, Yafu and
                 Wu, Yulun and Chen, Jiacheng and Chen, Jiayu and Wang, Weijie and
                 Qu, Xiaoye and Cheng, Yu},
  title       = {Advancing Multimodal Reasoning: From Optimized Cold Start to Staged Reinforcement Learning},
  booktitle   = {International Conference on Learning Representations (ICLR)},
  year        = {2026},
  github_repo = {CSfufu/Revisual-R1},
}
2025
arXiv
Thinking with Images for Multimodal Reasoning: Foundations, Methods, and Future Frontiers
Zhaochen Su, Peng Xia, Hangyu Guo, Zhenhua Liu, Yan Ma, Xiaoye Qu, Jiaqi Liu, Yanshu Li, Kaide Zeng, Zhengyuan Yang, Linjie Li, Yu Cheng, Heng Ji, Junxian He, and Yi R. Fung
% arXiv preprint (survey). The journal string is kept for styles that only
% print the journal field; eprint/archiveprefix expose the same arXiv
% identifier in machine-readable form.
@article{su2025thinking,
  title         = {Thinking with Images for Multimodal Reasoning: Foundations, Methods, and Future Frontiers},
  author        = {Su, Zhaochen and Xia, Peng and Guo, Hangyu and Liu, Zhenhua and
                   Ma, Yan and Qu, Xiaoye and Liu, Jiaqi and Li, Yanshu and
                   Zeng, Kaide and Yang, Zhengyuan and Li, Linjie and Cheng, Yu and
                   Ji, Heng and He, Junxian and Fung, Yi R.},
  journal       = {arXiv preprint arXiv:2506.23918},
  eprint        = {2506.23918},
  archiveprefix = {arXiv},
  year          = {2025},
  github_repo   = {zhaochen0110/Awesome_Think_With_Images},
}
arXiv
OpenThinkIMG: Learning to Think with Images via Visual Tool Reinforcement Learning
Zhaochen Su, Linjie Li, Mingyang Song, Yunzhuo Hao, Zhengyuan Yang, Jun Zhang, Guanjie Chen, Jiawei Gu, Juntao Li, Xiaoye Qu, and Yu Cheng
% arXiv preprint. OpenThinkIMG is brace-protected so sentence-casing styles
% keep its capitalisation. The journal string is kept for styles that only
% print the journal field; eprint/archiveprefix carry the same identifier
% in machine-readable form.
@article{su2025openthinkimg,
  title         = {{OpenThinkIMG}: Learning to Think with Images via Visual Tool Reinforcement Learning},
  author        = {Su, Zhaochen and Li, Linjie and Song, Mingyang and Hao, Yunzhuo and
                   Yang, Zhengyuan and Zhang, Jun and Chen, Guanjie and Gu, Jiawei and
                   Li, Juntao and Qu, Xiaoye and Cheng, Yu},
  journal       = {arXiv preprint arXiv:2505.08617},
  eprint        = {2505.08617},
  archiveprefix = {arXiv},
  year          = {2025},
  github_repo   = {zhaochen0110/OpenThinkIMG},
}
ACL 2025
PRMBench: A Fine-grained and Challenging Benchmark for Process-Level Reward Models
Mingyang Song, Zhaochen Su, Xiaoye Qu, Jiawei Zhou, and Yu Cheng
In Annual Meeting of the Association for Computational Linguistics (ACL), 2025
% ACL 2025 paper. PRMBench is brace-protected; without the braces
% sentence-casing styles would print it as "Prmbench".
@inproceedings{song2025prmbench,
  title       = {{PRMBench}: A Fine-grained and Challenging Benchmark for Process-Level Reward Models},
  author      = {Song, Mingyang and Su, Zhaochen and Qu, Xiaoye and Zhou, Jiawei and Cheng, Yu},
  booktitle   = {Annual Meeting of the Association for Computational Linguistics (ACL)},
  year        = {2025},
  github_repo = {ssmisya/PRMBench},
}
2024
NeurIPS 2024
ConflictBank: A Benchmark for Evaluating Knowledge Conflicts in Large Language Models
Zhaochen Su, Jun Zhang, Xiaoye Qu, Tong Zhu, Yanshu Li, Jiashuo Sun, Juntao Li, Min Zhang, and Yu Cheng
In Advances in Neural Information Processing Systems (NeurIPS), 2024
% NeurIPS 2024 paper. ConflictBank is brace-protected so sentence-casing
% styles do not print it as "Conflictbank".
@inproceedings{su2024conflictbank,
  title       = {{ConflictBank}: A Benchmark for Evaluating Knowledge Conflicts in Large Language Models},
  author      = {Su, Zhaochen and Zhang, Jun and Qu, Xiaoye and Zhu, Tong and
                 Li, Yanshu and Sun, Jiashuo and Li, Juntao and Zhang, Min and
                 Cheng, Yu},
  booktitle   = {Advances in Neural Information Processing Systems (NeurIPS)},
  year        = {2024},
  github_repo = {zhaochen0110/conflictbank},
}
COLM 2024
Timo: Towards Better Temporal Reasoning for Language Models
Zhaochen Su, Jun Zhang, Tong Zhu, Xiaoye Qu, Juntao Li, Min Zhang, and Yu Cheng
% COLM 2024 paper. github_repo is a custom field that standard
% bibliography styles ignore.
@inproceedings{su2024timo,
  author      = {Su, Zhaochen and Zhang, Jun and Zhu, Tong and Qu, Xiaoye and
                 Li, Juntao and Zhang, Min and Cheng, Yu},
  title       = {Timo: Towards Better Temporal Reasoning for Language Models},
  booktitle   = {Conference on Language Modeling (COLM)},
  year        = {2024},
  github_repo = {zhaochen0110/Timo},
}
ACL 2024
Living in the Moment: Can Large Language Models Grasp Co-Temporal Reasoning?
Zhaochen Su, Juntao Li, Jun Zhang, Tong Zhu, Xiaoye Qu, Pan Zhou, Yan Bowen, Yu Cheng, and Min Zhang
In Annual Meeting of the Association for Computational Linguistics (ACL), 2024
% ACL 2024 paper. github_repo is a custom field that standard
% bibliography styles ignore.
@inproceedings{su2024living,
  author      = {Su, Zhaochen and Li, Juntao and Zhang, Jun and Zhu, Tong and
                 Qu, Xiaoye and Zhou, Pan and Bowen, Yan and Cheng, Yu and
                 Zhang, Min},
  title       = {Living in the Moment: Can Large Language Models Grasp Co-Temporal Reasoning?},
  booktitle   = {Annual Meeting of the Association for Computational Linguistics (ACL)},
  year        = {2024},
  github_repo = {zhaochen0110/Cotempqa},
}
EMNLP 2024
SURf: Teaching Large Vision-Language Models to Selectively Utilize Retrieved Information
Jiashuo Sun, Jihai Zhang, Yucheng Zhou, Zhaochen Su, Xiaoye Qu, and Yu Cheng
In Conference on Empirical Methods in Natural Language Processing (EMNLP), 2024
% EMNLP 2024 paper. SURf is brace-protected; without the braces
% sentence-casing styles would print it as "Surf".
@inproceedings{sun2024surf,
  title       = {{SURf}: Teaching Large Vision-Language Models to Selectively Utilize Retrieved Information},
  author      = {Sun, Jiashuo and Zhang, Jihai and Zhou, Yucheng and Su, Zhaochen and
                 Qu, Xiaoye and Cheng, Yu},
  booktitle   = {Conference on Empirical Methods in Natural Language Processing (EMNLP)},
  year        = {2024},
  github_repo = {GasolSun36/SURf},
}
2023
EMNLP 2023
Efficient Continue Training of Temporal Language Model with Structural Information
Zhaochen Su, Juntao Li, Zikang Zhang, Zihan Zhou, and Min Zhang
In Findings of the Association for Computational Linguistics: EMNLP 2023, 2023
% Findings of EMNLP 2023 paper. This entry has no github_repo field.
@inproceedings{su2023efficient,
  author    = {Su, Zhaochen and Li, Juntao and Zhang, Zikang and Zhou, Zihan and Zhang, Min},
  title     = {Efficient Continue Training of Temporal Language Model with Structural Information},
  booktitle = {Findings of the Association for Computational Linguistics: EMNLP 2023},
  year      = {2023},
}
2022
EMNLP 2022
Improving Temporal Generalization of Pre-trained Language Models with Lexical Semantic Change
Zhaochen Su, Zecheng Tang, Xinyan Guan, Lijun Wu, Min Zhang, and Juntao Li
In Conference on Empirical Methods in Natural Language Processing (EMNLP), 2022
% EMNLP 2022 paper. github_repo is a custom field that standard
% bibliography styles ignore.
@inproceedings{su2022improving,
  author      = {Su, Zhaochen and Tang, Zecheng and Guan, Xinyan and Wu, Lijun and
                 Zhang, Min and Li, Juntao},
  title       = {Improving Temporal Generalization of Pre-trained Language Models with Lexical Semantic Change},
  booktitle   = {Conference on Empirical Methods in Natural Language Processing (EMNLP)},
  year        = {2022},
  github_repo = {zhaochen0110/LMLM},
}