Publications | Zhaochen Su

2026

Tech Report

Kimi K2.5: Visual Agentic Intelligence

Kimi Team

arXiv preprint arXiv:2602.02276, 2026

% Kimi K2.5 technical report. The model name is brace-protected so that
% sentence-casing styles keep "K2.5"; eprint/archiveprefix expose the arXiv
% identifier in machine-readable form. github_repo is a non-standard field.
@article{kimiteam2026k25,
  author        = {{Kimi Team}},
  title         = {Kimi {K2.5}: Visual Agentic Intelligence},
  journal       = {arXiv preprint arXiv:2602.02276},
  year          = {2026},
  eprint        = {2602.02276},
  archiveprefix = {arXiv},
  github_repo   = {MoonshotAI/Kimi-K2.5},
}

Tech Report

The MiniMax-M2 Series: Mini Activations Unleashing Max Real-World Intelligence

MiniMax

arXiv preprint arXiv:2605.26494, 2026

arXiv Bib Code

% MiniMax-M2 technical report. The camel-case model name is brace-protected
% against sentence casing; eprint/archiveprefix carry the arXiv identifier
% separately from the free-text journal string.
@article{minimax2026m2,
  author        = {{MiniMax}},
  title         = {The {MiniMax-M2} Series: Mini Activations Unleashing Max Real-World Intelligence},
  journal       = {arXiv preprint arXiv:2605.26494},
  year          = {2026},
  eprint        = {2605.26494},
  archiveprefix = {arXiv},
  github_repo   = {MiniMax-AI/MiniMax-M2},
}

ICML 2026

XSkill: Continual Learning from Experience and Skills in Multimodal Agents

Guanyu Jiang, Zhaochen Su, Xiaoye Qu, and Yi R. (May) Fung

In International Conference on Machine Learning (ICML), 2026. Guanyu Jiang and Zhaochen Su contributed equally.

arXiv Bib Code

% ICML 2026 conference paper. "XSkill" is brace-protected: without braces a
% sentence-casing style would render it as "Xskill".
@inproceedings{jiang2026xskill,
  author      = {Jiang, Guanyu and Su, Zhaochen and Qu, Xiaoye and Fung, Yi R. (May)},
  title       = {{XSkill}: Continual Learning from Experience and Skills in Multimodal Agents},
  booktitle   = {International Conference on Machine Learning (ICML)},
  year        = {2026},
  github_repo = {XSkill-Agent/XSkill},
}

arXiv

AgentVista: Evaluating Multimodal Agents in Ultra-Challenging Realistic Visual Scenarios

Zhaochen Su, Jincheng Gao, Hangyu Guo, Zhenhua Liu, Lueyang Zhang, Xinyu Geng, Shijue Huang, Peng Xia, Guanyu Jiang, Cheng Wang, Yue Zhang, Yi R. (May) Fung, and Junxian He

arXiv preprint arXiv:2602.23166, 2026

arXiv Bib Code

% arXiv preprint. The benchmark name is brace-protected against sentence
% casing; eprint/archiveprefix make the arXiv identifier machine-readable.
@article{su2026agentvista,
  author        = {Su, Zhaochen and Gao, Jincheng and Guo, Hangyu and Liu, Zhenhua and Zhang, Lueyang and Geng, Xinyu and Huang, Shijue and Xia, Peng and Jiang, Guanyu and Wang, Cheng and Zhang, Yue and Fung, Yi R. (May) and He, Junxian},
  title         = {{AgentVista}: Evaluating Multimodal Agents in Ultra-Challenging Realistic Visual Scenarios},
  journal       = {arXiv preprint arXiv:2602.23166},
  year          = {2026},
  eprint        = {2602.23166},
  archiveprefix = {arXiv},
  github_repo   = {hkust-nlp/AgentVista},
}

ICLR 2026

The Tool Decathlon: Benchmarking Language Agents for Diverse, Realistic, and Long-Horizon Task Execution

Junlong Li, Wenshuo Zhao, Jian Zhao, Weihao Zeng, Haoze Wu, Xiaochen Wang, Rui Ge, Yuxuan Cao, Yuzhen Huang, Wei Liu, Junteng Liu, Zhaochen Su, Yiyang Guo, Fan Zhou, Lueyang Zhang, Juan Michelini, Xingyao Wang, Xiang Yue, Shuyan Zhou, Graham Neubig, and Junxian He

In International Conference on Learning Representations (ICLR), 2026

arXiv Bib Code

% ICLR 2026 conference paper. The benchmark's name is brace-protected so that
% sentence-casing styles do not lower-case "Decathlon".
@inproceedings{li2026toolathlon,
  author      = {Li, Junlong and Zhao, Wenshuo and Zhao, Jian and Zeng, Weihao and Wu, Haoze and Wang, Xiaochen and Ge, Rui and Cao, Yuxuan and Huang, Yuzhen and Liu, Wei and Liu, Junteng and Su, Zhaochen and Guo, Yiyang and Zhou, Fan and Zhang, Lueyang and Michelini, Juan and Wang, Xingyao and Yue, Xiang and Zhou, Shuyan and Neubig, Graham and He, Junxian},
  title       = {The {Tool Decathlon}: Benchmarking Language Agents for Diverse, Realistic, and Long-Horizon Task Execution},
  booktitle   = {International Conference on Learning Representations (ICLR)},
  year        = {2026},
  github_repo = {hkust-nlp/Toolathlon},
}

ICLR 2026

GRACE: Generative Representation Learning via Contrastive Policy Optimization

Jiashuo Sun, Shixuan Liu, Zhaochen Su, Xianrui Zhong, Pengcheng Jiang, Bowen Jin, Peiran Li, Weijia Shi, and Jiawei Han

In International Conference on Learning Representations (ICLR), 2026

arXiv Bib Code

% ICLR 2026 conference paper. The acronym "GRACE" is brace-protected; without
% braces a sentence-casing style would render it as "Grace".
@inproceedings{sun2026grace,
  author      = {Sun, Jiashuo and Liu, Shixuan and Su, Zhaochen and Zhong, Xianrui and Jiang, Pengcheng and Jin, Bowen and Li, Peiran and Shi, Weijia and Han, Jiawei},
  title       = {{GRACE}: Generative Representation Learning via Contrastive Policy Optimization},
  booktitle   = {International Conference on Learning Representations (ICLR)},
  year        = {2026},
  github_repo = {GasolSun36/GRACE},
}

ICLR 2026

Advancing Multimodal Reasoning: From Optimized Cold Start to Staged Reinforcement Learning

Shuang Chen, Yue Guo, Zhaochen Su, Yafu Li, Yulun Wu, Jiacheng Chen, Jiayu Chen, Weijie Wang, Xiaoye Qu, and Yu Cheng

In International Conference on Learning Representations (ICLR), 2026

arXiv Bib Code

% ICLR 2026 conference paper. github_repo is a non-standard field that
% standard bibliography styles ignore.
@inproceedings{chen2026advancing,
  author      = {Chen, Shuang and Guo, Yue and Su, Zhaochen and Li, Yafu and Wu, Yulun and Chen, Jiacheng and Chen, Jiayu and Wang, Weijie and Qu, Xiaoye and Cheng, Yu},
  title       = {Advancing Multimodal Reasoning: From Optimized Cold Start to Staged Reinforcement Learning},
  booktitle   = {International Conference on Learning Representations (ICLR)},
  year        = {2026},
  github_repo = {CSfufu/Revisual-R1},
}

2025

arXiv

Thinking with Images for Multimodal Reasoning: Foundations, Methods, and Future Frontiers

Zhaochen Su, Peng Xia, Hangyu Guo, Zhenhua Liu, Yan Ma, Xiaoye Qu, Jiaqi Liu, Yanshu Li, Kaide Zeng, Zhengyuan Yang, Linjie Li, Yu Cheng, Heng Ji, Junxian He, and Yi R. Fung

arXiv preprint arXiv:2506.23918, 2025

arXiv Bib Code

% arXiv preprint. eprint/archiveprefix carry the arXiv identifier in
% machine-readable form; the journal string is kept for styles that do not
% print eprint fields.
@article{su2025thinking,
  author        = {Su, Zhaochen and Xia, Peng and Guo, Hangyu and Liu, Zhenhua and Ma, Yan and Qu, Xiaoye and Liu, Jiaqi and Li, Yanshu and Zeng, Kaide and Yang, Zhengyuan and Li, Linjie and Cheng, Yu and Ji, Heng and He, Junxian and Fung, Yi R.},
  title         = {Thinking with Images for Multimodal Reasoning: Foundations, Methods, and Future Frontiers},
  journal       = {arXiv preprint arXiv:2506.23918},
  year          = {2025},
  eprint        = {2506.23918},
  archiveprefix = {arXiv},
  github_repo   = {zhaochen0110/Awesome_Think_With_Images},
}

arXiv

OpenThinkIMG: Learning to Think with Images via Visual Tool Reinforcement Learning

Zhaochen Su, Linjie Li, Mingyang Song, Yunzhuo Hao, Zhengyuan Yang, Jun Zhang, Guanjie Chen, Jiawei Gu, Juntao Li, Xiaoye Qu, and Yu Cheng

arXiv preprint arXiv:2505.08617, 2025

arXiv Bib Code

% arXiv preprint. "OpenThinkIMG" is brace-protected against sentence casing;
% eprint/archiveprefix make the arXiv identifier machine-readable.
@article{su2025openthinkimg,
  author        = {Su, Zhaochen and Li, Linjie and Song, Mingyang and Hao, Yunzhuo and Yang, Zhengyuan and Zhang, Jun and Chen, Guanjie and Gu, Jiawei and Li, Juntao and Qu, Xiaoye and Cheng, Yu},
  title         = {{OpenThinkIMG}: Learning to Think with Images via Visual Tool Reinforcement Learning},
  journal       = {arXiv preprint arXiv:2505.08617},
  year          = {2025},
  eprint        = {2505.08617},
  archiveprefix = {arXiv},
  github_repo   = {zhaochen0110/OpenThinkIMG},
}

ACL 2025

PRMBench: A Fine-grained and Challenging Benchmark for Process-Level Reward Models

Mingyang Song, Zhaochen Su, Xiaoye Qu, Jiawei Zhou, and Yu Cheng

In Annual Meeting of the Association for Computational Linguistics (ACL), 2025

arXiv Bib Code

% ACL 2025 conference paper. "PRMBench" is brace-protected; without braces a
% sentence-casing style would render it as "Prmbench".
@inproceedings{song2025prmbench,
  author      = {Song, Mingyang and Su, Zhaochen and Qu, Xiaoye and Zhou, Jiawei and Cheng, Yu},
  title       = {{PRMBench}: A Fine-grained and Challenging Benchmark for Process-Level Reward Models},
  booktitle   = {Annual Meeting of the Association for Computational Linguistics (ACL)},
  year        = {2025},
  github_repo = {ssmisya/PRMBench},
}

2024

NeurIPS 2024

ConflictBank: A Benchmark for Evaluating Knowledge Conflicts in Large Language Models

Zhaochen Su, Jun Zhang, Xiaoye Qu, Tong Zhu, Yanshu Li, Jiashuo Sun, Juntao Li, Min Zhang, and Yu Cheng

In Advances in Neural Information Processing Systems (NeurIPS), 2024

arXiv Bib Code

% NeurIPS 2024 conference paper. "ConflictBank" is brace-protected; without
% braces a sentence-casing style would render it as "Conflictbank".
@inproceedings{su2024conflictbank,
  author      = {Su, Zhaochen and Zhang, Jun and Qu, Xiaoye and Zhu, Tong and Li, Yanshu and Sun, Jiashuo and Li, Juntao and Zhang, Min and Cheng, Yu},
  title       = {{ConflictBank}: A Benchmark for Evaluating Knowledge Conflicts in Large Language Models},
  booktitle   = {Advances in Neural Information Processing Systems (NeurIPS)},
  year        = {2024},
  github_repo = {zhaochen0110/conflictbank},
}

COLM 2024

Timo: Towards Better Temporal Reasoning for Language Models

Zhaochen Su, Jun Zhang, Tong Zhu, Xiaoye Qu, Juntao Li, Min Zhang, and Yu Cheng

In Conference on Language Modeling (COLM), 2024

arXiv Bib Code

% COLM 2024 conference paper. github_repo is a non-standard field that
% standard bibliography styles ignore.
@inproceedings{su2024timo,
  author      = {Su, Zhaochen and Zhang, Jun and Zhu, Tong and Qu, Xiaoye and Li, Juntao and Zhang, Min and Cheng, Yu},
  title       = {Timo: Towards Better Temporal Reasoning for Language Models},
  booktitle   = {Conference on Language Modeling (COLM)},
  year        = {2024},
  github_repo = {zhaochen0110/Timo},
}

ACL 2024

Living in the Moment: Can Large Language Models Grasp Co-Temporal Reasoning?

Zhaochen Su, Juntao Li, Jun Zhang, Tong Zhu, Xiaoye Qu, Pan Zhou, Yan Bowen, Yu Cheng, and Min Zhang

In Annual Meeting of the Association for Computational Linguistics (ACL), 2024

Oral arXiv Bib Code

Oral presentation at ACL 2024

% ACL 2024 conference paper. github_repo is a non-standard field that
% standard bibliography styles ignore.
@inproceedings{su2024living,
  author      = {Su, Zhaochen and Li, Juntao and Zhang, Jun and Zhu, Tong and Qu, Xiaoye and Zhou, Pan and Bowen, Yan and Cheng, Yu and Zhang, Min},
  title       = {Living in the Moment: Can Large Language Models Grasp Co-Temporal Reasoning?},
  booktitle   = {Annual Meeting of the Association for Computational Linguistics (ACL)},
  year        = {2024},
  github_repo = {zhaochen0110/Cotempqa},
}

EMNLP 2024

SURf: Teaching Large Vision-Language Models to Selectively Utilize Retrieved Information

Jiashuo Sun, Jihai Zhang, Yucheng Zhou, Zhaochen Su, Xiaoye Qu, and Yu Cheng

In Conference on Empirical Methods in Natural Language Processing (EMNLP), 2024

arXiv Bib Code

% EMNLP 2024 conference paper. The mixed-case acronym "SURf" is
% brace-protected; without braces a sentence-casing style would render it
% as "Surf".
@inproceedings{sun2024surf,
  author      = {Sun, Jiashuo and Zhang, Jihai and Zhou, Yucheng and Su, Zhaochen and Qu, Xiaoye and Cheng, Yu},
  title       = {{SURf}: Teaching Large Vision-Language Models to Selectively Utilize Retrieved Information},
  booktitle   = {Conference on Empirical Methods in Natural Language Processing (EMNLP)},
  year        = {2024},
  github_repo = {GasolSun36/SURf},
}

2023

EMNLP 2023

Efficient Continue Training of Temporal Language Model with Structural Information

Zhaochen Su, Juntao Li, Zikang Zhang, Zihan Zhou, and Min Zhang

In Findings of the Association for Computational Linguistics: EMNLP 2023, 2023

Bib PDF

% Findings of EMNLP 2023 paper; this entry carries no github_repo field.
@inproceedings{su2023efficient,
  author    = {Su, Zhaochen and Li, Juntao and Zhang, Zikang and Zhou, Zihan and Zhang, Min},
  title     = {Efficient Continue Training of Temporal Language Model with Structural Information},
  booktitle = {Findings of the Association for Computational Linguistics: EMNLP 2023},
  year      = {2023},
}

2022

EMNLP 2022

Improving Temporal Generalization of Pre-trained Language Models with Lexical Semantic Change

Zhaochen Su, Zecheng Tang, Xinyan Guan, Lijun Wu, Min Zhang, and Juntao Li

In Conference on Empirical Methods in Natural Language Processing (EMNLP), 2022

Bib PDF Code

% EMNLP 2022 conference paper. github_repo is a non-standard field that
% standard bibliography styles ignore.
@inproceedings{su2022improving,
  author      = {Su, Zhaochen and Tang, Zecheng and Guan, Xinyan and Wu, Lijun and Zhang, Min and Li, Juntao},
  title       = {Improving Temporal Generalization of Pre-trained Language Models with Lexical Semantic Change},
  booktitle   = {Conference on Empirical Methods in Natural Language Processing (EMNLP)},
  year        = {2022},
  github_repo = {zhaochen0110/LMLM},
}