LOCP: Latency-optimized channel pruning for CNN inference acceleration on GPUs

Yonghua Zhang, Hongxu Jiang, Yuting Zhu, Runhua Zhang, Yongxiang Cao, Chenhui Zhu, Wei Wang, Dong Dong, Xiaobin Li. LOCP: Latency-optimized channel pruning for CNN inference acceleration on GPUs. The Journal of Supercomputing, 79(13):14313–14341, September 2023. https://doi.org/10.1007/s11227-023-05212-4

% Journal article record for the LOCP paper (The Journal of Supercomputing, vol. 79, no. 13).
% Acronyms in the title are brace-protected so sentence-casing styles keep their capitals;
% researchr/cites/citedby are non-standard fields carried over from the export and ignored by standard styles.
@article{ZhangJZZCZWDL23,
  author    = {Zhang, Yonghua and Jiang, Hongxu and Zhu, Yuting and Zhang, Runhua and Cao, Yongxiang and Zhu, Chenhui and Wang, Wei and Dong, Dong and Li, Xiaobin},
  title     = {{LOCP}: Latency-optimized channel pruning for {CNN} inference acceleration on {GPUs}},
  journal   = {The Journal of Supercomputing},
  volume    = {79},
  number    = {13},
  pages     = {14313--14341},
  year      = {2023},
  month     = sep,
  doi       = {10.1007/s11227-023-05212-4},
  url       = {https://doi.org/10.1007/s11227-023-05212-4},
  researchr = {https://researchr.org/publication/ZhangJZZCZWDL23},
  cites     = {0},
  citedby   = {0},
}