% AnyPrefer (conference paper). The mixed-case name in the title is braced so
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{zhou2024anyprefer,
  author    = {Zhou, Yiyang and Wang, Zhaoyang and Wang, Tianle and Xing, Shangyu and Xia, Peng and Li, Bo and Zheng, Kaiyuan and Zhang, Zijian and Chen, Zhaorun and Zheng, Wenhao and Zhang, Xuchao and Bansal, Chetan and Zhang, Weitong and Wei, Ying and Bansal, Mohit and Yao, Huaxiu},
  title     = {{AnyPrefer}: An Agentic Framework for Preference Data Synthesis},
  booktitle = {International Conference on Learning Representations},
  year      = {2025},
}
preprint
GePBench: Evaluating Fundamental Geometric Perception for Multimodal Large Language Models
Shangyu Xing, Changhao Xiang, Yuteng Han, Yifan Yue, and 5 more authors
% GePBench (under review). The submission status is not a journal name, so the
% entry is typed @unpublished and the status is carried in `note`.
@unpublished{xing2024gepbenchevaluatingfundamentalgeometric,
  author = {Xing, Shangyu and Xiang, Changhao and Han, Yuteng and Yue, Yifan and Wu, Zhen and Liu, Xinyu and Wu, Zhangtai and Zhao, Fei and Dai, Xinyu},
  title  = {{GePBench}: Evaluating Fundamental Geometric Perception for Multimodal Large Language Models},
  note   = {Submitted to {ICML} 2026},
  year   = {2025},
}
ACL
Maximizing the Effectiveness of Larger BERT Models for Compression
Wenshu Fan, Su Lu, Shangyu Xing, Xinchun Li, and 1 more author
% ACL 2025 main-conference paper. Conference papers use @inproceedings with the
% proceedings title in `booktitle`; the track is kept in `note`.
% NOTE(review): proceedings title expanded from the original "ACL 2025 (main)" - confirm volume (long/short papers) if needed.
@inproceedings{bert-comp,
  author    = {Fan, Wenshu and Lu, Su and Xing, Shangyu and Li, Xinchun and Zhan, Dechuan},
  title     = {Maximizing the Effectiveness of Larger {BERT} Models for Compression},
  booktitle = {Proceedings of the 63rd Annual Meeting of the {Association for Computational Linguistics}},
  year      = {2025},
  note      = {Main conference},
}
EMNLP
RealBench: A Chinese Multi-image Understanding Benchmark Close to Real-world Scenarios
Fei Zhao, Chengqiang Lu, Yufan Shen, Qimeng Wang, and 8 more authors
% Findings of EMNLP 2025 paper. Conference papers use @inproceedings with the
% proceedings title in `booktitle` (original entry had "EMNLP 2025 (findings)" in `journal`).
@inproceedings{realbench,
  author    = {Zhao, Fei and Lu, Chengqiang and Shen, Yufan and Wang, Qimeng and Qian, Yicheng and Zhang, Haoxin and Gao, Yan and Hu, Yao and Wu, Zhen and Song, Dingjie and Xing, Shangyu and Dai, Xinyu},
  title     = {{RealBench}: A {Chinese} Multi-image Understanding Benchmark Close to Real-world Scenarios},
  booktitle = {Findings of the {Association for Computational Linguistics}: {EMNLP} 2025},
  year      = {2025},
}
ICLR
Lookahead Tree-Based Rollouts for Enhanced Trajectory-Level Exploration in Reinforcement Learning with Verifiable Rewards
Shangyu Xing, Siyuan Wang, Chenyuan Yang, Xinyu Dai, and 1 more author
% ICLR 2026 paper. Conference papers use @inproceedings with the venue in
% `booktitle` (original entry had "ICLR 2026" in `journal`).
% NOTE(review): year changed from 2025 to 2026 to agree with the ICLR 2026 venue;
% revert if the page intentionally groups this paper under 2025.
@inproceedings{rlvr-rollout,
  author    = {Xing, Shangyu and Wang, Siyuan and Yang, Chenyuan and Dai, Xinyu and Ren, Xiang},
  title     = {Lookahead Tree-Based Rollouts for Enhanced Trajectory-Level Exploration in Reinforcement Learning with Verifiable Rewards},
  booktitle = {International Conference on Learning Representations},
  year      = {2026},
}
2024
EMNLP
EFUF: Efficient Fine-grained Unlearning Framework for Mitigating Hallucinations in Multimodal Large Language Models
Shangyu Xing, Fei Zhao, Zhen Wu, Tuo An, and 4 more authors
% EMNLP 2024 main-conference paper. Conference papers use @inproceedings with
% the proceedings title in `booktitle`; the track is kept in `note`.
@inproceedings{xing2024efuf,
  author    = {Xing, Shangyu and Zhao, Fei and Wu, Zhen and An, Tuo and Chen, Weihao and Li, Chunhui and Zhang, Jianbing and Dai, Xinyu},
  title     = {{EFUF}: Efficient Fine-grained Unlearning Framework for Mitigating Hallucinations in Multimodal Large Language Models},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  year      = {2024},
  note      = {Main conference},
}
preprint
AlignGPT: Multi-modal Large Language Models with Adaptive Alignment Capability
Fei Zhao, Taotian Pang, Chunhui Li, Zhen Wu, and 3 more authors
% AlignGPT preprint. "preprint" is a publication status, not a journal, so the
% entry is typed @misc and the status is carried in `note`.
@misc{zhao2024aligngpt,
  author = {Zhao, Fei and Pang, Taotian and Li, Chunhui and Wu, Zhen and Guo, Junjie and Xing, Shangyu and Dai, Xinyu},
  title  = {{AlignGPT}: Multi-modal Large Language Models with Adaptive Alignment Capability},
  note   = {Preprint},
  year   = {2024},
}
2023
ACMMM
DRIN: Dynamic Relation Interactive Network for Multimodal Entity Linking
Shangyu Xing*, Fei Zhao*, Zhen Wu, Chunhui Li, and 2 more authors
In Proceedings of the 31st ACM International Conference on Multimedia, 2023
% DRIN (ACM Multimedia 2023). Acronyms are braced so sentence-casing styles
% keep them uppercase.
@inproceedings{xing2023drin,
  author    = {Xing, Shangyu and Zhao, Fei and Wu, Zhen and Li, Chunhui and Zhang, Jianbing and Dai, Xinyu},
  title     = {{DRIN}: Dynamic Relation Interactive Network for Multimodal Entity Linking},
  booktitle = {Proceedings of the 31st {ACM} International Conference on Multimedia},
  pages     = {3599--3608},
  year      = {2023},
}
2022
ACMMM
Learning from different text-image pairs: a relation-enhanced graph convolutional network for multimodal NER
Fei Zhao, Chunhui Li, Zhen Wu, Shangyu Xing, and 1 more author
In Proceedings of the 30th ACM International Conference on Multimedia, 2022
% Relation-enhanced GCN for multimodal NER (ACM Multimedia 2022). The title is
% stored in Title Case with acronyms braced, and the proceedings name is
% capitalised as a proper noun.
@inproceedings{zhao2022learning,
  author    = {Zhao, Fei and Li, Chunhui and Wu, Zhen and Xing, Shangyu and Dai, Xinyu},
  title     = {Learning from Different Text-Image Pairs: A Relation-Enhanced Graph Convolutional Network for Multimodal {NER}},
  booktitle = {Proceedings of the 30th {ACM} International Conference on Multimedia},
  pages     = {3983--3992},
  year      = {2022},
}