% INT-FlashAttention arXiv preprint; the arXiv identifier is stored in the eprint fields.
@article{chen2025intflash,
  author        = {Chen, Shimao and Liu, Zirui and Wu, Zhiying and Zheng, Ce and Cong, Peizhuang and Jiang, Zihan and Wu, Yuhan and Su, Lei and Yang, Tong},
  title         = {INT-FlashAttention: Enabling Flash Attention for INT8 Quantization},
  journal       = {arXiv preprint},
  year          = {2025},
  eprint        = {2409.16997},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2409.16997},
}
TOIS
CAFE+: Towards Compact, Adaptive, and Fast Embedding for Large-scale Online Recommendation Models
% CAFE+ journal article in ACM Transactions on Information Systems (2025).
@article{liu2025cafe+,
  author    = {Liu, Zirui and Zhang, Hailin and Chen, Boxuan and Jiang, Zihan and Zhao, Yikai and Tao, Yangyu and Yang, Tong and Cui, Bin},
  title     = {CAFE+: Towards Compact, Adaptive, and Fast Embedding for Large-scale Online Recommendation Models},
  journal   = {ACM Transactions on Information Systems},
  publisher = {ACM},
  year      = {2025},
}
ICDE
Extendible RDMA-based Remote Memory KV Store with Dynamic Perfect Hashing Index
% ICDE 2025 conference paper on an extendible RDMA-based remote-memory KV store.
@inproceedings{liu2025extendible,
  author       = {Liu, Zirui and Niu, Xian and Zhou, Wei and Hong, Yisen and Shi, Zhouran and Yang, Tong and Zhang, Yuchao and Wu, Yuhan and Zhao, Yikai and Fan, Zhuochen and Cui, Bin},
  title        = {Extendible RDMA-based Remote Memory KV Store with Dynamic Perfect Hashing Index},
  booktitle    = {Proceedings of the IEEE 41st International Conference on Data Engineering (ICDE)},
  organization = {IEEE},
  year         = {2025},
}
ICDE
CuckooGraph: A Scalable and Space-Time Efficient Data Structure for Large-Scale Dynamic Graphs
Zhuochen Fan#, Yalun Cai#, Zirui Liu#, Jiarui Guo, Xin Fan, Tong Yang, and Bin Cui
In Proceedings of the IEEE 41st International Conference on Data Engineering (ICDE), May 2025
% ICDE 2025 conference paper introducing the CuckooGraph data structure.
@inproceedings{fan2025cuckoograph,
  author       = {Fan, Zhuochen and Cai, Yalun and Liu, Zirui and Guo, Jiarui and Fan, Xin and Yang, Tong and Cui, Bin},
  title        = {CuckooGraph: A Scalable and Space-Time Efficient Data Structure for Large-Scale Dynamic Graphs},
  booktitle    = {Proceedings of the IEEE 41st International Conference on Data Engineering (ICDE)},
  organization = {IEEE},
  year         = {2025},
}
ICDE
HourglassSketch: An Efficient and Scalable Framework for Graph Stream Summarization
Jiarui Guo#, Boxuan Chen#, Kaicheng Yang#, Tong Yang, Zirui Liu, Qiuheng Yin, Sha Wang, Yuhan Wu, Xiaolin Wang, Bin Cui, and
4 more authors
In Proceedings of the IEEE 41st International Conference on Data Engineering (ICDE), May 2025
% ICDE 2025 conference paper on the HourglassSketch graph-stream summarization framework.
@inproceedings{guo2025hourglassssketch,
  author       = {Guo, Jiarui and Chen, Boxuan and Yang, Kaicheng and Yang, Tong and Liu, Zirui and Yin, Qiuheng and Wang, Sha and Wu, Yuhan and Wang, Xiaolin and Cui, Bin and Li, Tao and Peng, Xi and Chen, Renhai and Zhang, Gong},
  title        = {HourglassSketch: An Efficient and Scalable Framework for Graph Stream Summarization},
  booktitle    = {Proceedings of the IEEE 41st International Conference on Data Engineering (ICDE)},
  organization = {IEEE},
  year         = {2025},
}
2024
VLDBJ
Enabling Space-Time Efficient Range Queries with REncoder
% REncoder range-query article in The VLDB Journal (2024).
@article{fan2024enabling,
  author    = {Fan, Zhuochen and Ye, Bowen and Wang, Ziwei and Zhong, Zheng and Guo, Jiarui and Wu, Yuhan and Li, Haoyu and Yang, Tong and Tu, Yaofeng and Liu, Zirui and Cui, Bin},
  title     = {Enabling Space-Time Efficient Range Queries with REncoder},
  journal   = {The VLDB Journal},
  publisher = {Springer},
  year      = {2024},
}
VLDBJ
WavingSketch: An Unbiased and Generic Sketch for Finding Top-k Items in Data Streams
Zirui Liu, Fenghao Dong, Chengwu Liu, Xiangwei Deng, Tong Yang, Yikai Zhao, Jizhou Li, Bin Cui, and Gong Zhang
% WavingSketch article in The VLDB Journal (2024).
@article{liu2024waving,
  author    = {Liu, Zirui and Dong, Fenghao and Liu, Chengwu and Deng, Xiangwei and Yang, Tong and Zhao, Yikai and Li, Jizhou and Cui, Bin and Zhang, Gong},
  title     = {WavingSketch: An Unbiased and Generic Sketch for Finding Top-k Items in Data Streams},
  journal   = {The VLDB Journal},
  publisher = {Springer},
  year      = {2024},
}
TKDE
A Unified Framework for Mining Batch and Periodic Batch in Data Streams
% Batch / periodic-batch mining article in IEEE Transactions on Knowledge and Data Engineering (2024).
@article{liu2024hypercalm,
  author    = {Liu, Zirui and Wang, Xiangyuan and Wu, Yuhan and Yang, Tong and Yang, Kaicheng and Zhang, Hailin and Tu, Yaofeng and Cui, Bin},
  title     = {A Unified Framework for Mining Batch and Periodic Batch in Data Streams},
  journal   = {IEEE Transactions on Knowledge and Data Engineering},
  publisher = {IEEE},
  year      = {2024},
}
VLDB
Experimental Analysis of Large-scale Learnable Vector Storage Compression
% VLDB 2024 paper; the journal field names the periodical and the conference is recorded in the note.
@article{zhang2024experimental,
  author    = {Zhang, Hailin and Zhao, Penghao and Miao, Xupeng and Shao, Yingxia and Liu, Zirui and Yang, Tong and Cui, Bin},
  title     = {Experimental Analysis of Large-scale Learnable Vector Storage Compression},
  journal   = {Proceedings of the VLDB Endowment},
  publisher = {VLDB Endowment},
  year      = {2024},
  note      = {Presented at the 50th International Conference on Very Large Data Bases (VLDB)},
}
SIGMOD
CAFE: Towards Compact, Adaptive, and Fast Embedding for Large-scale Recommendation Models (Honorable Mention for Best Artifact)
% SIGMOD 2024 paper; the title is plain text, and the conference and award are recorded in the note.
@article{zhang2024cafe,
  author    = {Zhang, Hailin and Liu, Zirui and Chen, Boxuan and Zhao, Yikai and Zhao, Tong and Yang, Tong and Cui, Bin},
  title     = {CAFE: Towards Compact, Adaptive, and Fast Embedding for Large-scale Recommendation Models},
  journal   = {Proceedings of the ACM on Management of Data},
  publisher = {ACM},
  address   = {New York, NY, USA},
  year      = {2024},
  note      = {Presented at the 2024 ACM International Conference on Management of Data (SIGMOD). Honorable Mention for Best Artifact},
}
2023
TPDS
SketchINT: Empowering INT with TowerSketch for Per-flow Per-switch Measurement
% SketchINT journal article in IEEE Transactions on Parallel and Distributed Systems (2023).
@article{yang2023sketchint,
  author    = {Yang, Kaicheng and Long, Sheng and Shi, Qilong and Li, Yuanpeng and Liu, Zirui and Wu, Yuhan and Yang, Tong and Jia, Zhengyi},
  title     = {SketchINT: Empowering INT with TowerSketch for Per-flow Per-switch Measurement},
  journal   = {IEEE Transactions on Parallel and Distributed Systems},
  publisher = {IEEE},
  year      = {2023},
}
TPDS
BurstBalancer: Do Less, Better Balance for Large-scale Data Center Traffic
Zirui Liu#, Yikai Zhao#, Zhuochen Fan#, Tong Yang, Xiaodong Li, Ruwen Zhang, Kaicheng Yang, Zihan Jiang, Zheng Zhong, Yi Huang, and
4 more authors
IEEE Transactions on Parallel and Distributed Systems, Jul 2023
% BurstBalancer journal article in IEEE Transactions on Parallel and Distributed Systems (2023).
@article{liu2023burstbalancer,
  author    = {Liu, Zirui and Zhao, Yikai and Fan, Zhuochen and Yang, Tong and Li, Xiaodong and Zhang, Ruwen and Yang, Kaicheng and Jiang, Zihan and Zhong, Zheng and Huang, Yi and Liu, Cong and Hu, Jing and Xie, Gaogang and Cui, Bin},
  title     = {BurstBalancer: Do Less, Better Balance for Large-scale Data Center Traffic},
  journal   = {IEEE Transactions on Parallel and Distributed Systems},
  publisher = {IEEE},
  year      = {2023},
}
SIGCOMM
ChameleMon: Shifting Measurement Attention as Network State Changes
Kaicheng Yang#, Yuhan Wu#, Ruijie Miao#, Tong Yang, Zirui Liu, Zicang Xu, Rui Qiu, Yikai Zhao, Hanglong Lv, Zhigang Ji, and
1 more author
In Proceedings of the 2023 Conference of the ACM Special Interest Group on Data Communication (SIGCOMM), Sep 2023
% SIGCOMM 2023 conference paper on ChameleMon; publisher name and city are separate fields.
@inproceedings{yang2023chamelemon,
  author    = {Yang, Kaicheng and Wu, Yuhan and Miao, Ruijie and Yang, Tong and Liu, Zirui and Xu, Zicang and Qiu, Rui and Zhao, Yikai and Lv, Hanglong and Ji, Zhigang and Xie, Gaogang},
  title     = {ChameleMon: Shifting Measurement Attention as Network State Changes},
  booktitle = {Proceedings of the 2023 Conference of the ACM Special Interest Group on Data Communication (SIGCOMM)},
  publisher = {ACM},
  address   = {New York, NY, USA},
  year      = {2023},
}
SIGCOMM
P4LRU: Towards An LRU Cache Entirely in Programmable Data Plane
Yikai Zhao#, Wenrui Liu#, Fenghao Dong, Tong Yang, Yuanpeng Li, Kaicheng Yang, Zirui Liu, Zhengyi Jia, and Yongqiang Yang
In Proceedings of the 2023 Conference of the ACM Special Interest Group on Data Communication (SIGCOMM), Sep 2023
% SIGCOMM 2023 conference paper on P4LRU; publisher name and city are separate fields.
@inproceedings{zhao2023p4lru,
  author    = {Zhao, Yikai and Liu, Wenrui and Dong, Fenghao and Yang, Tong and Li, Yuanpeng and Yang, Kaicheng and Liu, Zirui and Jia, Zhengyi and Yang, Yongqiang},
  title     = {P4LRU: Towards An LRU Cache Entirely in Programmable Data Plane},
  booktitle = {Proceedings of the 2023 Conference of the ACM Special Interest Group on Data Communication (SIGCOMM)},
  publisher = {ACM},
  address   = {New York, NY, USA},
  year      = {2023},
}
SIGMOD
TreeSensing: Linearly Compressing Sketches with Flexibility
Zirui Liu, Yixin Zhang, Yifan Zhu, Ruwen Zhang, Tong Yang, Kun Xie, Sha Wang, Tao Li, and Bin Cui
In Proceedings of the 2023 ACM International Conference on Management of Data (SIGMOD), Jun 2023
% SIGMOD 2023 paper; volume, number, pages and DOI refer to the journal named in the journal field.
@article{liu2023treesensing,
  author    = {Liu, Zirui and Zhang, Yixin and Zhu, Yifan and Zhang, Ruwen and Yang, Tong and Xie, Kun and Wang, Sha and Li, Tao and Cui, Bin},
  title     = {TreeSensing: Linearly Compressing Sketches with Flexibility},
  journal   = {Proceedings of the ACM on Management of Data},
  volume    = {1},
  number    = {1},
  pages     = {1--28},
  publisher = {ACM},
  address   = {New York, NY, USA},
  year      = {2023},
  doi       = {10.1145/3588910},
  note      = {Presented at the 2023 ACM International Conference on Management of Data (SIGMOD)},
}
ICDE
HyperCalm Sketch: One-pass Mining Periodic Batches in Data Streams
Zirui Liu#, Chaozhe Kong#, Kaicheng Yang#, Tong Yang, Ruijie Miao, Qizhi Chen, Yikai Zhao, Yaofeng Tu, and Bin Cui
In Proceedings of the IEEE 39th International Conference on Data Engineering (ICDE), Apr 2023
% ICDE 2023 conference paper on the HyperCalm Sketch.
@inproceedings{liu2023hypercalm,
  author       = {Liu, Zirui and Kong, Chaozhe and Yang, Kaicheng and Yang, Tong and Miao, Ruijie and Chen, Qizhi and Zhao, Yikai and Tu, Yaofeng and Cui, Bin},
  title        = {HyperCalm Sketch: One-pass Mining Periodic Batches in Data Streams},
  booktitle    = {Proceedings of the IEEE 39th International Conference on Data Engineering (ICDE)},
  organization = {IEEE},
  year         = {2023},
}
2022
ICNP
BurstBalancer: Do Less, Better Balance for Large-scale Data Center Traffic
Zirui Liu#, Yikai Zhao#, Zhuochen Fan#, Tong Yang, Xiaodong Li, Ruwen Zhang, Kaicheng Yang, Zheng Zhong, Yi Huang, Cong Liu, and
3 more authors
In Proceedings of the IEEE 30th International Conference on Network Protocols (ICNP), Nov 2022
% ICNP 2022 conference version of BurstBalancer.
@inproceedings{liu2022burstbalancer,
  author       = {Liu, Zirui and Zhao, Yikai and Fan, Zhuochen and Yang, Tong and Li, Xiaodong and Zhang, Ruwen and Yang, Kaicheng and Zhong, Zheng and Huang, Yi and Liu, Cong and Hu, Jing and Xie, Gaogang and Cui, Bin},
  title        = {BurstBalancer: Do Less, Better Balance for Large-scale Data Center Traffic},
  booktitle    = {Proceedings of the IEEE 30th International Conference on Network Protocols (ICNP)},
  pages        = {1--13},
  organization = {IEEE},
  year         = {2022},
  doi          = {10.1109/ICNP55882.2022.9940372},
}
2021
ICNP
SketchINT: Empowering INT with TowerSketch for Per-flow Per-switch Measurement
Kaicheng Yang#, Yuanpeng Li#, Zirui Liu#, Tong Yang, Yu Zhou, Jintao He, Tong Zhao, Zhengyi Jia, and Yongqiang Yang
In Proceedings of the IEEE 29th International Conference on Network Protocols (ICNP), Nov 2021
% ICNP 2021 conference version of SketchINT.
@inproceedings{yang2021sketchint,
  author       = {Yang, Kaicheng and Li, Yuanpeng and Liu, Zirui and Yang, Tong and Zhou, Yu and He, Jintao and Zhao, Tong and Jia, Zhengyi and Yang, Yongqiang},
  title        = {SketchINT: Empowering INT with TowerSketch for Per-flow Per-switch Measurement},
  booktitle    = {Proceedings of the IEEE 29th International Conference on Network Protocols (ICNP)},
  pages        = {1--12},
  organization = {IEEE},
  year         = {2021},
  doi          = {10.1109/ICNP52444.2021.9651940},
}
SIGKDD
MapEmbed: Perfect Hashing with High Load Factor and Fast Update
Yuhan Wu#, Zirui Liu#, Xiang Yu#, Jie Gui, Haochen Gan, Yuhao Han, Tao Li, Ori Rottenstreich, and Tong Yang
In Proceedings of the 27th ACM SIGKDD Conference on Knowledge Discovery & Data Mining, Aug 2021
% SIGKDD 2021 conference paper on MapEmbed; the ampersand in the booktitle is LaTeX-escaped.
@inproceedings{wu2021mapembed,
  author    = {Wu, Yuhan and Liu, Zirui and Yu, Xiang and Gui, Jie and Gan, Haochen and Han, Yuhao and Li, Tao and Rottenstreich, Ori and Yang, Tong},
  title     = {MapEmbed: Perfect Hashing with High Load Factor and Fast Update},
  booktitle = {Proceedings of the 27th ACM SIGKDD Conference on Knowledge Discovery \& Data Mining},
  pages     = {1863--1872},
  publisher = {ACM},
  address   = {New York, NY, USA},
  year      = {2021},
  doi       = {10.1145/3447548.3467240},
}
NSDI
LightGuardian: A Full-visibility, Lightweight, In-band Telemetry System Using Sketchlets
Yikai Zhao#, Kaicheng Yang#, Zirui Liu#, Tong Yang, Li Chen, Shiyi Liu, Naiqian Zheng, Ruixin Wang, Hanbo Wu, Yi Wang, and
1 more author
In Proceedings of the 18th USENIX Symposium on Networked Systems Design and Implementation (NSDI), Apr 2021
% NSDI 2021 conference paper on the LightGuardian in-band telemetry system.
@inproceedings{zhao2021lightguardian,
  author    = {Zhao, Yikai and Yang, Kaicheng and Liu, Zirui and Yang, Tong and Chen, Li and Liu, Shiyi and Zheng, Naiqian and Wang, Ruixin and Wu, Hanbo and Wang, Yi and Zhang, Nicholas},
  title     = {LightGuardian: A Full-visibility, Lightweight, In-band Telemetry System Using Sketchlets},
  booktitle = {Proceedings of the 18th USENIX Symposium on Networked Systems Design and Implementation (NSDI)},
  pages     = {991--1010},
  publisher = {USENIX Association},
  year      = {2021},
}