Zhengxu Xia, Yitian Hao, Jun Duan, Chen Wang, Junchen Jiang. Towards Optimal Preemptive GPU Time-Sharing for Edge Model Serving. In Proceedings of the 9th International Workshop on Container Technologies and Container Clouds, WoC 2023, Bologna, Italy, December 11-15, 2023. pages 13-18, ACM, 2023. [doi]
@comment{
  XiaHDWJ23: workshop paper in the WoC 2023 proceedings (ACM).
  The researchr, cites and citedby fields are non-standard bookkeeping
  fields carried over from the export; standard styles ignore them.
  The url field is the resolver form of the doi field.
}
@inproceedings{XiaHDWJ23,
  author    = {Xia, Zhengxu and Hao, Yitian and Duan, Jun and Wang, Chen and Jiang, Junchen},
  title     = {Towards Optimal Preemptive {GPU} Time-Sharing for Edge Model Serving},
  booktitle = {Proceedings of the 9th International Workshop on Container Technologies and Container Clouds, {WoC} 2023, {Bologna}, {Italy}, December 11--15, 2023},
  pages     = {13--18},
  publisher = {ACM},
  year      = {2023},
  doi       = {10.1145/3631311.3632401},
  url       = {https://doi.org/10.1145/3631311.3632401},
  researchr = {https://researchr.org/publication/XiaHDWJ23},
  cites     = {0},
  citedby   = {0},
}