Publications

ChipMATE: Multi-Agent Training via Reinforcement Learning for Enhanced RTL Generation

Zhongkai Yu, Yichen Lin, Chenyang Zhou, Yuwei Zhang, Kun Zhou, Junxia Cui, Haotian Ye, Zhengding Hu, Zaifeng Pan, Ruiyi Wang, Yujie Zhao, Hejia Zhang, Jingbo Shang, Jishen Zhao, Yufei Ding

arXiv preprint arXiv:2605.12857, 2026

@misc{yu2026chipmate,
  author        = {Yu, Zhongkai and Lin, Yichen and Zhou, Chenyang and Zhang, Yuwei and Zhou, Kun and Cui, Junxia and Ye, Haotian and Hu, Zhengding and Pan, Zaifeng and Wang, Ruiyi and Zhao, Yujie and Zhang, Hejia and Shang, Jingbo and Zhao, Jishen and Ding, Yufei},
  title         = {{ChipMATE}: Multi-Agent Training via Reinforcement Learning for Enhanced {RTL} Generation},
  year          = {2026},
  eprint        = {2605.12857},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2605.12857},
}

ChipBench: A Next-Step Benchmark for Evaluating LLM Performance in AI-Aided Chip Design

Zhongkai Yu*, Chenyang Zhou*, Yichen Lin, Hejia Zhang, Haotian Ye, Junxia Cui, Zaifeng Pan, Jishen Zhao, Yufei Ding

arXiv preprint arXiv:2601.21448, 2026

@misc{yu2026chipbench,
  author        = {Yu, Zhongkai and Zhou, Chenyang and Lin, Yichen and Zhang, Hejia and Ye, Haotian and Cui, Junxia and Pan, Zaifeng and Zhao, Jishen and Ding, Yufei},
  title         = {{ChipBench}: A Next-Step Benchmark for Evaluating {LLM} Performance in {AI}-Aided Chip Design},
  year          = {2026},
  eprint        = {2601.21448},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2601.21448},
}

AMMA: A Multi-Chiplet Memory-Centric Architecture for Low-Latency 1M Context Attention Serving

Zhongkai Yu, Haotian Ye, Chenyang Zhou, Ohm Rishabh Venkatachalam, Zaifeng Pan, Zhengding Hu, Junsung Kim, Won Woo Ro, Po-An Tsai, Shuyi Pei, Yangwook Kang, Yufei Ding

arXiv preprint arXiv:2604.26103, 2026

@misc{yu2026amma,
  author        = {Yu, Zhongkai and Ye, Haotian and Zhou, Chenyang and Venkatachalam, Ohm Rishabh and Pan, Zaifeng and Hu, Zhengding and Kim, Junsung and Ro, Won Woo and Tsai, Po-An and Pei, Shuyi and Kang, Yangwook and Ding, Yufei},
  title         = {{AMMA}: A Multi-Chiplet Memory-Centric Architecture for Low-Latency {1M} Context Attention Serving},
  year          = {2026},
  eprint        = {2604.26103},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2604.26103},
}

Assassyn: A Unified Abstraction for Architectural Simulation and Implementation

Jian Weng, Boyang Han, Derui Gao, Ruijie Gao, Wanning Zhang, An Zhong, Ceyu Xu, Jihao Xin, Yangzhixin Luo, Lisa Wu Wills, et al.

Proceedings of the 52nd Annual International Symposium on Computer Architecture (ISCA), pp. 1464–1479, 2025

@inproceedings{weng2025assassyn,
  author    = {Weng, Jian and Han, Boyang and Gao, Derui and Gao, Ruijie and Zhang, Wanning and Zhong, An and Xu, Ceyu and Xin, Jihao and Luo, Yangzhixin and Wills, Lisa Wu and others},
  title     = {{Assassyn}: A Unified Abstraction for Architectural Simulation and Implementation},
  booktitle = {Proceedings of the 52nd Annual International Symposium on Computer Architecture ({ISCA})},
  pages     = {1464--1479},
  year      = {2025},
}

Patterns behind Chaos: Forecasting Data Movement for Efficient Large-Scale MoE LLM Inference

Zhongkai Yu, Yue Guan, Zihao Yu, Chenyang Zhou, Shuyi Pei, Yangwook Kang, Yufei Ding, Po-An Tsai

Proceedings of the 53rd Annual International Symposium on Computer Architecture (ISCA), 2026

Best Paper Candidate

@inproceedings{yu2026patterns,
  author    = {Yu, Zhongkai and Guan, Yue and Yu, Zihao and Zhou, Chenyang and Pei, Shuyi and Kang, Yangwook and Ding, Yufei and Tsai, Po-An},
  title     = {Patterns behind Chaos: Forecasting Data Movement for Efficient Large-Scale {MoE} {LLM} Inference},
  booktitle = {Proceedings of the 53rd Annual International Symposium on Computer Architecture ({ISCA})},
  year      = {2026},
}