Jiajun Wei, Hongjian Zhan, Yue Lu 0001, Xiao Tu, Bing Yin, Cong Liu, Umapada Pal 0001. Image as a Language: Revisiting Scene Text Recognition via Balanced, Unified and Synchronized Vision-Language Reasoning Network. In Michael J. Wooldridge, Jennifer G. Dy, Sriraam Natarajan, editors, Thirty-Eighth AAAI Conference on Artificial Intelligence, AAAI 2024, Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, IAAI 2024, Fourteenth Symposium on Educational Advances in Artificial Intelligence, EAAI 2024, February 20-27, 2024, Vancouver, Canada. Pages 5885-5893, AAAI Press, 2024. [doi]
% Conference paper entry. Author and editor names are stored in "Last, First"
% form; numeric homonym-disambiguation suffixes (e.g. "0001") are omitted on
% purpose so they are not printed as part of a name. The researchr, cites and
% citedby fields are non-standard and are ignored by bibliography styles.
@inproceedings{WeiZ0TYL024,
  author    = {Wei, Jiajun and Zhan, Hongjian and Lu, Yue and Tu, Xiao and Yin, Bing and Liu, Cong and Pal, Umapada},
  title     = {Image as a Language: Revisiting Scene Text Recognition via Balanced, Unified and Synchronized Vision-Language Reasoning Network},
  booktitle = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024, Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver, Canada},
  editor    = {Wooldridge, Michael J. and Dy, Jennifer G. and Natarajan, Sriraam},
  pages     = {5885--5893},
  publisher = {AAAI Press},
  year      = {2024},
  doi       = {10.1609/aaai.v38i6.28402},
  url       = {https://doi.org/10.1609/aaai.v38i6.28402},
  researchr = {https://researchr.org/publication/WeiZ0TYL024},
  cites     = {0},
  citedby   = {0},
}