VideoLLM-online: Online Video Large Language Model for Streaming Video

Joya Chen, Zhaoyang Lv, Shiwei Wu, Kevin Qinghong Lin, Chenan Song, Difei Gao, Jia-Wei Liu, Ziteng Gao, Dongxing Mao, Mike Zheng Shou. VideoLLM-online: Online Video Large Language Model for Streaming Video. In IEEE/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2024, Seattle, WA, USA, June 16–22, 2024, pages 18407–18418. IEEE, 2024. doi:10.1109/CVPR52733.2024.01742

% Conference paper (CVPR 2024). The fields researchr, cites and citedby are
% non-standard bookkeeping fields; standard bibliography styles ignore them.
@inproceedings{ChenLWLSGLGMS24,
  author    = {Chen, Joya and Lv, Zhaoyang and Wu, Shiwei and Lin, Kevin Qinghong and Song, Chenan and Gao, Difei and Liu, Jia-Wei and Gao, Ziteng and Mao, Dongxing and Shou, Mike Zheng},
  title     = {{VideoLLM-online}: Online Video Large Language Model for Streaming Video},
  booktitle = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2024, Seattle, WA, USA, June 16--22, 2024},
  pages     = {18407--18418},
  publisher = {IEEE},
  year      = {2024},
  doi       = {10.1109/CVPR52733.2024.01742},
  url       = {https://doi.org/10.1109/CVPR52733.2024.01742},
  isbn      = {979-8-3503-5300-6},
  researchr = {https://researchr.org/publication/ChenLWLSGLGMS24},
  cites     = {0},
  citedby   = {0},
}