Fine-grained Audible Video Description

Xuyang Shen, Dong Li, Jinxing Zhou, Zhen Qin, Bowen He, Xiaodong Han, Aixuan Li, Yuchao Dai, Lingpeng Kong, Meng Wang, Yu Qiao, Yiran Zhong. Fine-grained Audible Video Description. In IEEE/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2023, Vancouver, BC, Canada, June 17-24, 2023. pages 10585-10596, IEEE, 2023. [doi]

@comment{
  Conference paper in the CVPR 2023 proceedings.
  The fields researchr, cites and citedby are not standard BibTeX fields;
  standard styles ignore unknown fields, so they are kept purely as metadata.
}
@inproceedings{ShenLZQHHLDKWQZ23,
  author    = {Shen, Xuyang and Li, Dong and Zhou, Jinxing and Qin, Zhen and He, Bowen and Han, Xiaodong and Li, Aixuan and Dai, Yuchao and Kong, Lingpeng and Wang, Meng and Qiao, Yu and Zhong, Yiran},
  title     = {Fine-grained Audible Video Description},
  booktitle = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2023, Vancouver, BC, Canada, June 17--24, 2023},
  pages     = {10585--10596},
  publisher = {IEEE},
  year      = {2023},
  isbn      = {979-8-3503-0129-8},
  doi       = {10.1109/CVPR52729.2023.01020},
  url       = {https://doi.org/10.1109/CVPR52729.2023.01020},
  researchr = {https://researchr.org/publication/ShenLZQHHLDKWQZ23},
  cites     = {0},
  citedby   = {0},
}