VideoAgent: A Memory-Augmented Multimodal Agent for Video Understanding

researchr

You are not signed in
Sign in
Sign up

Yue Fan, Xiaojian Ma, Rujie Wu, Yuntao Du 0001, Jiaqi Li, Zhi Gao, Qing Li 0003. VideoAgent: A Memory-Augmented Multimodal Agent for Video Understanding. In Ales Leonardis, Elisa Ricci 0001, Stefan Roth 0001, Olga Russakovsky, Torsten Sattler, Gül Varol, editors, Computer Vision - ECCV 2024 - 18th European Conference, Milan, Italy, September 29-October 4, 2024, Proceedings, Part XXII. Volume 15080 of Lecture Notes in Computer Science, pages 75-92, Springer, 2024. [doi]

% ECCV 2024 paper (LNCS 15080). Cleaned from the researchr export: extraction
% placeholder removed from the title, DBLP homonym suffixes removed from names,
% page and date ranges written with double hyphens.
@inproceedings{FanMWDLGL24,
  author    = {Fan, Yue and Ma, Xiaojian and Wu, Rujie and Du, Yuntao and Li, Jiaqi and Gao, Zhi and Li, Qing},
  title     = {{VideoAgent}: A Memory-Augmented Multimodal Agent for Video Understanding},
  editor    = {Leonardis, Ales and Ricci, Elisa and Roth, Stefan and Russakovsky, Olga and Sattler, Torsten and Varol, G{\"u}l},
  booktitle = {Computer Vision -- {ECCV} 2024 -- 18th European Conference, Milan, Italy, September 29--October 4, 2024, Proceedings, Part XXII},
  series    = {Lecture Notes in Computer Science},
  volume    = {15080},
  pages     = {75--92},
  publisher = {Springer},
  year      = {2024},
  isbn      = {978-3-031-72670-5},
  doi       = {10.1007/978-3-031-72670-5_5},
  url       = {https://doi.org/10.1007/978-3-031-72670-5_5},
  researchr = {https://researchr.org/publication/FanMWDLGL24},
  cites     = {0},
  citedby   = {0},
}

External Links

Cite Key

Statistics

PDF

Researchr

VideoAgent: A Memory-Augmented Multimodal Agent for Video Understanding