A multimodal attention fusion network with a dynamic vocabulary for TextVQA

Jiajia Wu, Jun Du, Fengren Wang, Chen Yang, Xinzhe Jiang, Jinshui Hu, Bing Yin, Jianshu Zhang, Lirong Dai. A multimodal attention fusion network with a dynamic vocabulary for TextVQA. Pattern Recognition, 122:108214, 2022. doi:10.1016/j.patcog.2021.108214

% Journal article in Pattern Recognition, volume 122. The `pages` field holds
% the value 108214, which matches the DOI suffix and so appears to be an
% article number rather than a page range.
% `researchr`, `cites` and `citedby` are non-standard bookkeeping fields;
% standard bibliography styles ignore them.
@article{WuDWYJHYZD22,
  author    = {Wu, Jiajia and Du, Jun and Wang, Fengren and Yang, Chen and Jiang, Xinzhe and Hu, Jinshui and Yin, Bing and Zhang, Jianshu and Dai, Lirong},
  title     = {A multimodal attention fusion network with a dynamic vocabulary for {TextVQA}},
  journal   = {Pattern Recognition},
  volume    = {122},
  pages     = {108214},
  year      = {2022},
  doi       = {10.1016/j.patcog.2021.108214},
  url       = {https://doi.org/10.1016/j.patcog.2021.108214},
  researchr = {https://researchr.org/publication/WuDWYJHYZD22},
  cites     = {0},
  citedby   = {0},
}