% ISCA 2025 conference paper: Magellan loop-guided prefetcher.
@inproceedings{fu2025magellan,
  author    = {Fu, Gelin and Xia, Tian and Yin, Mingzhuo and Nair, Prashant J. and Lis, Mieszko and Ren, Pengju},
  title     = {Magellan: A High-Performance Loop-Guided Prefetcher for Indirect Memory Access},
  booktitle = {Proceedings of the 52nd Annual International Symposium on Computer Architecture (ISCA)},
  pages     = {601--615},
  year      = {2025}
}
TCAS-I
FP2: A 2-bit Floating-Point Format for Edge-AI Inference and Fine-Tuning
% Title words carrying acronyms are brace-protected so that styles which
% sentence-case titles keep their capitalization.
@article{dang2025fp2,
  author    = {Dang, Qiwei and Ma, Chengyu and Huang, Haiduo and Fu, Gelin and Huo, Zhiwang and Yang, Guoming and Zong, Pengchen and Xia, Tian and Zhao, Wenzhe and Ren, Pengju},
  title     = {{FP2}: A 2-bit Floating-Point Format for {Edge-AI} Inference and Fine-Tuning},
  journal   = {IEEE Transactions on Circuits and Systems I: Regular Papers},
  year      = {2025},
  publisher = {IEEE}
}
TCAD
Hierarchical-ISA Supporting Row-wise Operands for Efficient DNN Computation
Zhiwang Huo, Wenzhe Zhao, Qiwei Dang, Chengyu Ma, Guoming Yang, Gelin Fu, Tian Xia, and Pengju Ren
IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems, 2025
% Title words carrying acronyms are brace-protected so that styles which
% sentence-case titles keep their capitalization.
@article{huo2025hierarchical,
  author    = {Huo, Zhiwang and Zhao, Wenzhe and Dang, Qiwei and Ma, Chengyu and Yang, Guoming and Fu, Gelin and Xia, Tian and Ren, Pengju},
  title     = {{Hierarchical-ISA} Supporting Row-wise Operands for Efficient {DNN} Computation},
  journal   = {IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems},
  year      = {2025},
  publisher = {IEEE}
}
2024
HPCA
Differential-Matching Prefetcher for Indirect Memory Access
Gelin Fu, Tian Xia, Zhongpei Luo, Ruiyang Chen, Wenzhe Zhao, and Pengju Ren
In 2024 IEEE International Symposium on High-Performance Computer Architecture (HPCA), 2024
% HPCA 2024 conference paper: differential-matching prefetcher.
@inproceedings{fu2024differential,
  author       = {Fu, Gelin and Xia, Tian and Luo, Zhongpei and Chen, Ruiyang and Zhao, Wenzhe and Ren, Pengju},
  title        = {Differential-Matching Prefetcher for Indirect Memory Access},
  booktitle    = {2024 IEEE International Symposium on High-Performance Computer Architecture (HPCA)},
  pages        = {439--453},
  year         = {2024},
  organization = {IEEE}
}
2023
ICCD
PrSpMV: An Efficient Predictable Kernel for SpMV
Gelin Fu, Tian Xia, Shaoru Qu, Zhongpei Luo, Shuyu Li, Pengyu Cheng, Runfan Guo, Yitong Ding, and Pengju Ren
In 2023 IEEE 41st International Conference on Computer Design (ICCD), 2023
% The mixed-case kernel names in the title are brace-protected so that styles
% which sentence-case titles keep their capitalization.
@inproceedings{fu2023prspmv,
  author       = {Fu, Gelin and Xia, Tian and Qu, Shaoru and Luo, Zhongpei and Li, Shuyu and Cheng, Pengyu and Guo, Runfan and Ding, Yitong and Ren, Pengju},
  title        = {{PrSpMV}: An Efficient Predictable Kernel for {SpMV}},
  booktitle    = {2023 IEEE 41st International Conference on Computer Design (ICCD)},
  pages        = {448--456},
  year         = {2023},
  organization = {IEEE}
}
2022
TCAS-I
An Energy-and-Area-Efficient CNN Accelerator for Universal Powers-of-Two Quantization
Tian Xia, Boran Zhao, Jian Ma, Gelin Fu, Wenzhe Zhao, Nanning Zheng, and Pengju Ren
IEEE Transactions on Circuits and Systems I: Regular Papers, 2022
% The acronym in the title is brace-protected so that styles which
% sentence-case titles keep its capitalization.
% NOTE(review): volume 70, number 3 may correspond to a 2023 issue date; the
% year 2022 could be the early-access date. Confirm against the publisher record.
@article{xia2022energy,
  author    = {Xia, Tian and Zhao, Boran and Ma, Jian and Fu, Gelin and Zhao, Wenzhe and Zheng, Nanning and Ren, Pengju},
  title     = {An Energy-and-Area-Efficient {CNN} Accelerator for Universal Powers-of-Two Quantization},
  journal   = {IEEE Transactions on Circuits and Systems I: Regular Papers},
  volume    = {70},
  number    = {3},
  pages     = {1242--1255},
  year      = {2022},
  publisher = {IEEE}
}
TPDS
A Comprehensive Performance Model of Sparse Matrix-Vector Multiplication to Guide Kernel Optimization
Tian Xia, Gelin Fu, Chenyang Li, Zhongpei Luo, Lucheng Zhang, Ruiyang Chen, Wenzhe Zhao, Nanning Zheng, and Pengju Ren
IEEE Transactions on Parallel and Distributed Systems, 2022
% TPDS journal article: performance model for sparse matrix-vector multiplication.
% NOTE(review): volume 34, number 2 may correspond to a 2023 issue date; the
% year 2022 could be the early-access date. Confirm against the publisher record.
@article{xia2022comprehensive,
  author    = {Xia, Tian and Fu, Gelin and Li, Chenyang and Luo, Zhongpei and Zhang, Lucheng and Chen, Ruiyang and Zhao, Wenzhe and Zheng, Nanning and Ren, Pengju},
  title     = {A Comprehensive Performance Model of Sparse Matrix-Vector Multiplication to Guide Kernel Optimization},
  journal   = {IEEE Transactions on Parallel and Distributed Systems},
  volume    = {34},
  number    = {2},
  pages     = {519--534},
  year      = {2022},
  publisher = {IEEE}
}