Cordelia Schmid. Do you see what I see?: Large-scale Learning from Multimodal Videos. In Heng Tao Shen, Yueting Zhuang, John R. Smith, Yang Yang, Pablo Cesar, Florian Metze, and Balakrishnan Prabhakaran, editors, MM '21: ACM Multimedia Conference, Virtual Event, China, October 20-24, 2021, page 2643. ACM, 2021. doi:10.1145/3474085.3476967
% Single-page paper in the MM '21 proceedings (ACM, 2021).
% Braces around "I" and "ACM" keep their capitalisation under styles that
% apply sentence casing. The fields researchr, cites, and citedby are
% non-standard (carried over from the researchr.org record) and are ignored
% by standard bibliography styles.
@inproceedings{Schmid21-1,
  author    = {Schmid, Cordelia},
  title     = {Do you see what {I} see?: Large-scale Learning from Multimodal Videos},
  booktitle = {MM '21: {ACM} Multimedia Conference, Virtual Event, China, October 20--24, 2021},
  editor    = {Shen, Heng Tao and Zhuang, Yueting and Smith, John R. and Yang, Yang and Cesar, Pablo and Metze, Florian and Prabhakaran, Balakrishnan},
  pages     = {2643},
  publisher = {ACM},
  year      = {2021},
  isbn      = {978-1-4503-8651-7},
  doi       = {10.1145/3474085.3476967},
  url       = {https://doi.org/10.1145/3474085.3476967},
  researchr = {https://researchr.org/publication/Schmid21-1},
  cites     = {0},
  citedby   = {0},
}