Zhihang Lin, Mingbao Lin, Luxi Lin, Rongrong Ji. Boosting Multimodal Large Language Models with Visual Tokens Withdrawal for Rapid Inference. In Toby Walsh, Julie Shah, Zico Kolter, editors, AAAI-25, Sponsored by the Association for the Advancement of Artificial Intelligence, February 25 - March 4, 2025, Philadelphia, PA, USA, pages 5334-5342. AAAI Press, 2025. doi:10.1609/aaai.v39i5.32567
@comment{Conference paper in the AAAI-25 proceedings. The researchr, cites and
citedby fields are non-standard export metadata that standard styles ignore.}
@inproceedings{LinLLJ25,
  author    = {Lin, Zhihang and Lin, Mingbao and Lin, Luxi and Ji, Rongrong},
  title     = {Boosting Multimodal Large Language Models with Visual Tokens Withdrawal for Rapid Inference},
  booktitle = {{AAAI-25}, Sponsored by the Association for the Advancement of Artificial Intelligence, February 25 - March 4, 2025, Philadelphia, PA, USA},
  editor    = {Walsh, Toby and Shah, Julie and Kolter, Zico},
  pages     = {5334--5342},
  publisher = {AAAI Press},
  year      = {2025},
  isbn      = {978-1-57735-897-8},
  doi       = {10.1609/aaai.v39i5.32567},
  url       = {https://doi.org/10.1609/aaai.v39i5.32567},
  researchr = {https://researchr.org/publication/LinLLJ25},
  cites     = {0},
  citedby   = {0},
}