Yupan Huang, Zhaoyang Zeng, and Yutong Lu. Be Specific, Be Clear: Bridging Machine and Human Captions by Scene-Guided Transformer. In Bei Liu, Jianlong Fu, Shizhe Chen, Qin Jin, Alexander G. Hauptmann, and Yong Rui, editors, MMPT@ICMR2021: Proceedings of the 2021 Workshop on Multi-Modal Pre-Training for Multimedia Understanding, Taipei, Taiwan, August 21, 2021, pages 4-13. ACM, 2021. doi:10.1145/3463945.3469054
% Workshop paper published in the MMPT workshop proceedings (ACM, 2021).
% Names use the unambiguous "Last, First" form; the numeric homonym suffix
% that followed the first editor's name was dropped because BibTeX would
% otherwise parse it as the surname.
% researchr, cites and citedby are not standard BibTeX fields; they are kept
% as export metadata and are ignored by standard bibliography styles.
@inproceedings{HuangZL21-1,
  author    = {Huang, Yupan and Zeng, Zhaoyang and Lu, Yutong},
  title     = {Be Specific, Be Clear: Bridging Machine and Human Captions by Scene-Guided Transformer},
  booktitle = {{MMPT@ICMR2021}: Proceedings of the 2021 Workshop on Multi-Modal Pre-Training for Multimedia Understanding, Taipei, Taiwan, August 21, 2021},
  editor    = {Liu, Bei and Fu, Jianlong and Chen, Shizhe and Jin, Qin and Hauptmann, Alexander G. and Rui, Yong},
  pages     = {4--13},
  publisher = {ACM},
  year      = {2021},
  isbn      = {978-1-4503-8530-5},
  doi       = {10.1145/3463945.3469054},
  url       = {https://doi.org/10.1145/3463945.3469054},
  researchr = {https://researchr.org/publication/HuangZL21-1},
  cites     = {0},
  citedby   = {0},
}