Mozhgan Nasr Azadani, James Riddell, Sean Sedwards, Krzysztof Czarnecki 0001. Rethinking the Mixture of Vision Encoders Paradigm for Enhanced Visual Understanding in Multimodal LLMs. Trans. Mach. Learn. Res., 2026, 2026. [doi]
@article{AzadaniRSC26,
title = {Rethinking the Mixture of Vision Encoders Paradigm for Enhanced Visual Understanding in Multimodal LLMs},
author = {Mozhgan Nasr Azadani and James Riddell and Sean Sedwards and Krzysztof Czarnecki 0001},
year = {2026},
url = {https://openreview.net/forum?id=tgnTVmRybs},
researchr = {https://researchr.org/publication/AzadaniRSC26},
cites = {0},
citedby = {0},
journal = {Trans. Mach. Learn. Res.},
volume = {2026},
}