Chia-Wen Kuo, Zsolt Kira. Beyond a Pre-Trained Object Detector: Cross-Modal Textual and Visual Context for Image Captioning. In IEEE/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2022, New Orleans, LA, USA, June 18-24, 2022, pages 17948-17958. IEEE, 2022. doi:10.1109/CVPR52688.2022.01744
% Conference paper (CVPR 2022 proceedings, published by IEEE).
% The researchr, cites and citedby fields are not standard BibTeX fields;
% standard styles ignore them. They are kept as exported metadata.
@inproceedings{KuoK22-2,
  author    = {Kuo, Chia-Wen and Kira, Zsolt},
  title     = {Beyond a Pre-Trained Object Detector: Cross-Modal Textual and Visual Context for Image Captioning},
  booktitle = {IEEE/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2022, New Orleans, LA, USA, June 18--24, 2022},
  pages     = {17948--17958},
  publisher = {IEEE},
  year      = {2022},
  isbn      = {978-1-6654-6946-3},
  doi       = {10.1109/CVPR52688.2022.01744},
  url       = {https://doi.org/10.1109/CVPR52688.2022.01744},
  researchr = {https://researchr.org/publication/KuoK22-2},
  cites     = {0},
  citedby   = {0},
}