📝 Publications
[ISCA’25] Mao Lin, Yuan Feng, Guilherme Cox and Hyeran Jeon. “Forest: Access-aware GPU UVM Management”. The 52nd Annual International Symposium on Computer Architecture (ISCA), June 21–25, 2025, Tokyo, Japan. 🌐 ❞
Forest: Access-aware GPU UVM Management
@inproceedings{lin2025forest,
  author    = {Lin, Mao and Feng, Yuan and Cox, Guilherme and Jeon, Hyeran},
  title     = {Forest: Access-aware {GPU} {UVM} Management},
  booktitle = {Proceedings of the 52nd Annual International Symposium on Computer Architecture},
  series    = {ISCA '25},
  location  = {Tokyo, Japan},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  year      = {2025},
  pages     = {137--152},
  numpages  = {16},
  isbn      = {9798400712616},
  doi       = {10.1145/3695053.3731047},
  url       = {https://doi.org/10.1145/3695053.3731047},
  keywords  = {Unified Virtual Memory, Prefetching, GPU, Memory Management},
}
[EuroMLSys’25] Mao Lin and Hyeran Jeon. “Understanding Oversubscribed Memory Management for Deep Learning Training”. The 5th Workshop on Machine Learning and Systems, March 30–April 3, 2025, Rotterdam, Netherlands. 🌐 💬 ❞
Understanding Oversubscribed Memory Management for Deep Learning Training
@inproceedings{lin2025understanding,
  author    = {Lin, Mao and Jeon, Hyeran},
  title     = {Understanding Oversubscribed Memory Management for Deep Learning Training},
  booktitle = {Proceedings of the 5th Workshop on Machine Learning and Systems},
  series    = {EuroMLSys '25},
  location  = {World Trade Center, Rotterdam, Netherlands},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  year      = {2025},
  pages     = {46--55},
  numpages  = {10},
  isbn      = {9798400715389},
  doi       = {10.1145/3721146.3721955},
  url       = {https://doi.org/10.1145/3721146.3721955},
  keywords  = {GPU, unified virtual memory, performance analysis, DNN, LLM},
}
[ASPLOS’23] Mao Lin, Keren Zhou, and Pengfei Su. “DrGPUM: Guiding Memory Optimization for GPU-accelerated Applications”. The 28th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, March 25–29, 2023, Vancouver, BC, Canada. 🌐 🔗 💬 ❞
DrGPUM: Guiding Memory Optimization for GPU-accelerated Applications
@inproceedings{lin2023drgpum,
  author    = {Lin, Mao and Zhou, Keren and Su, Pengfei},
  title     = {{DrGPUM}: Guiding Memory Optimization for {GPU}-Accelerated Applications},
  booktitle = {Proceedings of the 28th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 3},
  series    = {ASPLOS 2023},
  location  = {Vancouver, BC, Canada},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  year      = {2023},
  pages     = {164--178},
  numpages  = {15},
  isbn      = {9781450399180},
  doi       = {10.1145/3582016.3582044},
  url       = {https://doi.org/10.1145/3582016.3582044},
  keywords  = {CUDA, GPU profilers, GPUs, Memory management},
}
[PyTorch Conference’22] Mao Lin, Keren Zhou, and Pengfei Su. “Poster: Squeezing GPU Memory Usage in PyTorch”. Dec. 2022, New Orleans, LA, USA. 🌐
[TCAD’22] Zelin Du, Qianling Zhang, Mao Lin, Shiqing Li, Xin Li, and Lei Ju. “A Comprehensive Memory Management Framework for CPU-FPGA Heterogenous SoCs”. IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems (2022). 🌐 ❞
A Comprehensive Memory Management Framework for CPU-FPGA Heterogeneous SoCs
@article{9790045,
  author  = {Du, Zelin and Zhang, Qianling and Lin, Mao and Li, Shiqing and Li, Xin and Ju, Lei},
  title   = {A Comprehensive Memory Management Framework for {CPU-FPGA} Heterogenous {SoCs}},
  journal = {IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems},
  year    = {2023},
  volume  = {42},
  number  = {4},
  pages   = {1058--1071},
  doi     = {10.1109/TCAD.2022.3179323},
}