Zheng-Jun Zha, Jiawei Liu, Tianhao Yang, Yongdong Zhang. Spatiotemporal-Textual Co-Attention Network for Video Question Answering. TOMCCAP, 15(2s), 2019. doi:10.1145/3320061
% Journal article (TOMCCAP, volume 15, issue 2s, 2019). The journal field holds
% the full journal name rather than the acronym so that the bibliography style,
% not the database, decides how to abbreviate it. Fields researchr, cites and
% citedby are non-standard and are ignored by standard styles.
@article{ZhaLYZ19,
  author    = {Zha, Zheng-Jun and Liu, Jiawei and Yang, Tianhao and Zhang, Yongdong},
  title     = {Spatiotemporal-Textual Co-Attention Network for Video Question Answering},
  journal   = {{ACM} Transactions on Multimedia Computing, Communications, and Applications},
  volume    = {15},
  number    = {2s},
  year      = {2019},
  doi       = {10.1145/3320061},
  url       = {https://doi.org/10.1145/3320061},
  researchr = {https://researchr.org/publication/ZhaLYZ19},
  cites     = {0},
  citedby   = {0},
}