Last active 1729171888

vLLM-readme-2.bib Raw
% Kwon et al. (2023): conference paper on PagedAttention-based memory
% management for LLM serving. Braced words ({PagedAttention}, {ACM}, {SIGOPS})
% are case-protected so sentence-casing styles do not lowercase them.
@inproceedings{kwon2023efficient,
  author    = {Kwon, Woosuk and Li, Zhuohan and Zhuang, Siyuan and Sheng, Ying and Zheng, Lianmin and Yu, Cody Hao and Gonzalez, Joseph E. and Zhang, Hao and Stoica, Ion},
  title     = {Efficient Memory Management for Large Language Model Serving with {PagedAttention}},
  booktitle = {Proceedings of the {ACM} {SIGOPS} 29th Symposium on Operating Systems Principles},
  year      = {2023},
}