Yanghao Li, Chao-Yuan Wu, Haoqi Fan, Karttikeya Mangalam, Bo Xiong, Jitendra Malik, Christoph Feichtenhofer. MViTv2: Improved Multiscale Vision Transformers for Classification and Detection. In IEEE/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2022, New Orleans, LA, USA, June 18-24, 2022, pages 4794-4804. IEEE, 2022. doi: 10.1109/CVPR52688.2022.00476
@comment{
  Conference paper: MViTv2, published in the CVPR 2022 proceedings.
  The fields researchr, cites and citedby are not standard BibTeX fields;
  they are kept from the exported record and are ignored by standard styles.
  The exported author list had the numeric suffix 0001 after Haoqi Fan
  (presumably a database homonym-disambiguation id, not part of the name);
  it is omitted here so the surname is parsed as Fan.
}
@inproceedings{LiW0MXMF22,
  author    = {Li, Yanghao and Wu, Chao-Yuan and Fan, Haoqi and Mangalam, Karttikeya and Xiong, Bo and Malik, Jitendra and Feichtenhofer, Christoph},
  title     = {{MViTv2}: Improved Multiscale Vision Transformers for Classification and Detection},
  booktitle = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2022, New Orleans, LA, USA, June 18--24, 2022},
  pages     = {4794--4804},
  publisher = {IEEE},
  year      = {2022},
  isbn      = {978-1-6654-6946-3},
  doi       = {10.1109/CVPR52688.2022.00476},
  url       = {https://doi.org/10.1109/CVPR52688.2022.00476},
  researchr = {https://researchr.org/publication/LiW0MXMF22},
  cites     = {0},
  citedby   = {0},
}