Publications
ChipMATE: Multi-Agent Training via Reinforcement Learning for Enhanced RTL Generation
arXiv preprint arXiv:2605.12857, 2026
% ChipMATE arXiv preprint. The arXiv identifier is stored in the eprint
% fields (not in a journal field) so styles can format and link it.
@misc{yu2026chipmate,
  author        = {Yu, Zhongkai and Lin, Yichen and Zhou, Chenyang and Zhang, Yuwei and Zhou, Kun and Cui, Junxia and Ye, Haotian and Hu, Zhengding and Pan, Zaifeng and Wang, Ruiyi and Zhao, Yujie and Zhang, Hejia and Shang, Jingbo and Zhao, Jishen and Ding, Yufei},
  title         = {{ChipMATE}: Multi-Agent Training via Reinforcement Learning for Enhanced {RTL} Generation},
  year          = {2026},
  eprint        = {2605.12857},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2605.12857},
}
ChipBench: A Next-Step Benchmark for Evaluating LLM Performance in AI-Aided Chip Design
arXiv preprint arXiv:2601.21448, 2026
% ChipBench arXiv preprint. The arXiv identifier is stored in the eprint
% fields (not in a journal field) so styles can format and link it.
@misc{yu2026chipbench,
  author        = {Yu, Zhongkai and Zhou, Chenyang and Lin, Yichen and Zhang, Hejia and Ye, Haotian and Cui, Junxia and Pan, Zaifeng and Zhao, Jishen and Ding, Yufei},
  title         = {{ChipBench}: A Next-Step Benchmark for Evaluating {LLM} Performance in {AI}-Aided Chip Design},
  year          = {2026},
  eprint        = {2601.21448},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2601.21448},
}
AMMA: A Multi-Chiplet Memory-Centric Architecture for Low-Latency 1M Context Attention Serving
arXiv preprint arXiv:2604.26103, 2026
% AMMA arXiv preprint. The arXiv identifier is stored in the eprint
% fields (not in a journal field) so styles can format and link it.
@misc{yu2026amma,
  author        = {Yu, Zhongkai and Ye, Haotian and Zhou, Chenyang and Venkatachalam, Ohm Rishabh and Pan, Zaifeng and Hu, Zhengding and Kim, Junsung and Ro, Won Woo and Tsai, Po-An and Pei, Shuyi and Kang, Yangwook and Ding, Yufei},
  title         = {{AMMA}: A Multi-Chiplet Memory-Centric Architecture for Low-Latency {1M} Context Attention Serving},
  year          = {2026},
  eprint        = {2604.26103},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2604.26103},
}
Assassyn: A Unified Abstraction for Architectural Simulation and Implementation
Proceedings of the 52nd Annual International Symposium on Computer Architecture (ISCA), pp. 1464–1479, 2025
% Assassyn conference paper. The author list is truncated with the
% literal "and others" token, which the style renders as "et al.".
@inproceedings{weng2025assassyn,
  author    = {Weng, Jian and Han, Boyang and Gao, Derui and Gao, Ruijie and Zhang, Wanning and Zhong, An and Xu, Ceyu and Xin, Jihao and Luo, Yangzhixin and Wills, Lisa Wu and others},
  title     = {{Assassyn}: A Unified Abstraction for Architectural Simulation and Implementation},
  booktitle = {Proceedings of the 52nd Annual International Symposium on Computer Architecture ({ISCA})},
  pages     = {1464--1479},
  year      = {2025},
}
Patterns behind Chaos: Forecasting Data Movement for Efficient Large-Scale MoE LLM Inference
Proceedings of the 53rd Annual International Symposium on Computer Architecture (ISCA), 2026
Best Paper Candidate
% Conference paper on forecasting data movement for MoE LLM inference.
% Acronyms are braced so sentence-casing styles keep their capitalisation.
@inproceedings{yu2026patterns,
  author    = {Yu, Zhongkai and Guan, Yue and Yu, Zihao and Zhou, Chenyang and Pei, Shuyi and Kang, Yangwook and Ding, Yufei and Tsai, Po-An},
  title     = {Patterns behind Chaos: Forecasting Data Movement for Efficient Large-Scale {MoE} {LLM} Inference},
  booktitle = {Proceedings of the 53rd Annual International Symposium on Computer Architecture ({ISCA})},
  year      = {2026},
}