Yoshiaki Inoue. Queueing analysis of GPU-based inference servers with dynamic batching: A closed-form characterization. Perform. Eval., 147:102183, 2021. doi:10.1016/j.peva.2020.102183
% Journal article; "pages" holds the article number (the venue uses article IDs, not page ranges).
% The acronym GPU is brace-protected in the title so sentence-casing styles keep it uppercase.
@article{Inoue21-0,
  author    = {Inoue, Yoshiaki},
  title     = {Queueing analysis of {GPU}-based inference servers with dynamic batching: A closed-form characterization},
  journal   = {Performance Evaluation},
  volume    = {147},
  pages     = {102183},
  year      = {2021},
  doi       = {10.1016/j.peva.2020.102183},
  url       = {https://doi.org/10.1016/j.peva.2020.102183},
  researchr = {https://researchr.org/publication/Inoue21-0},
  cites     = {0},
  citedby   = {0},
}