Junchao Zhang, Yuxin Peng. Hierarchical Vision-Language Alignment for Video Captioning. In Ioannis Kompatsiaris, Benoit Huet, Vasileios Mezaris, Cathal Gurrin, Wen-Huang Cheng, Stefanos Vrochidis, editors, MultiMedia Modeling - 25th International Conference, MMM 2019, Thessaloniki, Greece, January 8-11, 2019, Proceedings, Part I. Volume 11295 of Lecture Notes in Computer Science, pages 42-54, Springer, 2019. doi:10.1007/978-3-030-05710-7_4
@comment{Conference paper published in the MMM 2019 proceedings (Lecture Notes in Computer Science, volume 11295). The researchr, cites and citedby fields are not standard BibTeX fields and are ignored by standard styles; they appear to be export metadata from researchr.org (TODO confirm before relying on them).}
@inproceedings{ZhangP19,
  author    = {Zhang, Junchao and Peng, Yuxin},
  title     = {Hierarchical Vision-Language Alignment for Video Captioning},
  booktitle = {{MultiMedia} Modeling -- 25th International Conference, {MMM} 2019, Thessaloniki, Greece, January 8--11, 2019, Proceedings, Part I},
  editor    = {Kompatsiaris, Ioannis and Huet, Benoit and Mezaris, Vasileios and Gurrin, Cathal and Cheng, Wen-Huang and Vrochidis, Stefanos},
  series    = {Lecture Notes in Computer Science},
  volume    = {11295},
  pages     = {42--54},
  publisher = {Springer},
  year      = {2019},
  isbn      = {978-3-030-05710-7},
  doi       = {10.1007/978-3-030-05710-7_4},
  url       = {https://doi.org/10.1007/978-3-030-05710-7_4},
  researchr = {https://researchr.org/publication/ZhangP19},
  cites     = {0},
  citedby   = {0},
}