Publications | Xueyi Chen

2026

StreamingTOM: Streaming Token Compression for Efficient Video Understanding

Xueyi Chen, Keda Tao, Kele Shao, and Huan Wang

In IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR), 2026

@inproceedings{chen2025streamingtom,
  title = {{StreamingTOM}: Streaming Token Compression for Efficient Video Understanding},
  author = {Chen, Xueyi and Tao, Keda and Shao, Kele and Wang, Huan},
  booktitle = {IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  year = {2026},
}

ICLR-W

MobileKernelBench: Can LLMs Write Efficient Kernels for Mobile Devices?

Xingze Zou*, Jing Wang*, Yuhua Zheng, Haolei Bai, Xueyi Chen, Lingcheng Kong, Zhaode Wang, Chengfei Lv, Syed A.R. Abu-Bakar, Haoji Hu, and Huan Wang

In ICLR Workshop on Data-centric Foundation Models (DATA-FM), Mar 2026

arXiv Bib PDF Code Website

@inproceedings{zou2026mobilekernelbench,
  title = {{MobileKernelBench}: Can {LLMs} Write Efficient Kernels for Mobile Devices?},
  author = {Zou, Xingze and Wang, Jing and Zheng, Yuhua and Bai, Haolei and Chen, Xueyi and Kong, Lingcheng and Wang, Zhaode and Lv, Chengfei and Abu-Bakar, Syed A. R. and Hu, Haoji and Wang, Huan},
  booktitle = {ICLR Workshop on Data-centric Foundation Models (DATA-FM)},
  year = {2026},
  month = mar,
}

arXiv

LVOmniBench: Pioneering Long Audio-Video Understanding Evaluation for Omnimodal LLMs

Keda Tao*, Yuhua Zheng*, Jia Xu, Wenjie Du, Kele Shao, Hesong Wang, Xueyi Chen, Xin Jin, Junhan Zhu, Bohan Yu, Weiqiang Wang, Jian Liu, Can Qin, Yulun Zhang, Ming-Hsuan Yang, and Huan Wang

arXiv preprint arXiv:2603.19217, Mar 2026

Under review

arXiv Bib PDF Code Website

@article{tao2026lvomnibench,
  title = {{LVOmniBench}: Pioneering Long Audio-Video Understanding Evaluation for Omnimodal {LLMs}},
  author = {Tao, Keda and Zheng, Yuhua and Xu, Jia and Du, Wenjie and Shao, Kele and Wang, Hesong and Chen, Xueyi and Jin, Xin and Zhu, Junhan and Yu, Bohan and Wang, Weiqiang and Liu, Jian and Qin, Can and Zhang, Yulun and Yang, Ming-Hsuan and Wang, Huan},
  journal = {arXiv preprint arXiv:2603.19217},
  eprint = {2603.19217},
  archiveprefix = {arXiv},
  year = {2026},
  month = mar,
  note = {Under review},
}

arXiv

DICE: Diffusion Large Language Models Excel at Generating CUDA Kernels

Haolei Bai, Lingcheng Kong, Xueyi Chen, Jianmian Wang, Zhiqiang Tao, and Huan Wang

arXiv preprint arXiv:2602.11715, Feb 2026

Under review

arXiv Bib PDF Code Website

@article{bai2026dice,
  title = {{DICE}: Diffusion Large Language Models Excel at Generating {CUDA} Kernels},
  author = {Bai, Haolei and Kong, Lingcheng and Chen, Xueyi and Wang, Jianmian and Tao, Zhiqiang and Wang, Huan},
  journal = {arXiv preprint arXiv:2602.11715},
  eprint = {2602.11715},
  archiveprefix = {arXiv},
  year = {2026},
  month = feb,
  note = {Under review},
}

2025

NeurIPS

On-Policy Optimization with Group Equivalent Preference for Multi-Programming Language Understanding

Haoyuan Wu*, Rui Ming*, Jilong Gao*, Hangyu Zhao, Xueyi Chen, Yikai Yang, Haisheng Zheng, Zhuolun He, and Bei Yu

In Advances in Neural Information Processing Systems (NeurIPS), Sep 2025

arXiv Bib PDF

@inproceedings{wu2025onpolicy,
  title = {On-Policy Optimization with Group Equivalent Preference for Multi-Programming Language Understanding},
  author = {Wu, Haoyuan and Ming, Rui and Gao, Jilong and Zhao, Hangyu and Chen, Xueyi and Yang, Yikai and Zheng, Haisheng and He, Zhuolun and Yu, Bei},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  year = {2025},
  month = sep,
  publisher = {Curran Associates, Inc.},
}

arXiv

ToTRL: Unlock LLM Tree-of-Thoughts Reasoning Potential through Puzzles Solving

Haoyuan Wu*, Xueyi Chen*, Rui Ming, Jilong Gao, Shoubo Hu, Zhuolun He, and Bei Yu

arXiv preprint arXiv:2505.12717, May 2025

Under review

arXiv Bib PDF

@article{wu2025totrl,
  title = {{ToTRL}: Unlock {LLM} Tree-of-Thoughts Reasoning Potential through Puzzles Solving},
  author = {Wu, Haoyuan and Chen, Xueyi and Ming, Rui and Gao, Jilong and Hu, Shoubo and He, Zhuolun and Yu, Bei},
  journal = {arXiv preprint arXiv:2505.12717},
  eprint = {2505.12717},
  archiveprefix = {arXiv},
  year = {2025},
  month = may,
  note = {Under review},
}