Weizhi Wang, Rongmei Lin, Shiyang Li, Colin Lockard, Ritesh Sarkhel, Sanket Lokegaonkar, Jingbo Shang, Xifeng Yan, Nasser Zalmout, Xian Li. Train a Unified Multimodal Data Quality Classifier with Synthetic Data. In Christos Christodoulopoulos, Tanmoy Chakraborty, Carolyn Rose, Violet Peng, editors, Findings of the Association for Computational Linguistics: EMNLP 2025, Suzhou, China, November 4-9, 2025, pages 1972-1986. Association for Computational Linguistics, 2025. [doi]
% Conference paper in the Findings of EMNLP 2025 proceedings (ACL Anthology).
% `researchr`, `cites` and `citedby` are non-standard bookkeeping fields from the
% exporting site; standard bibliography styles ignore them.
@inproceedings{WangLLLSLSYZL25,
  author    = {Wang, Weizhi and Lin, Rongmei and Li, Shiyang and Lockard, Colin and Sarkhel, Ritesh and Lokegaonkar, Sanket and Shang, Jingbo and Yan, Xifeng and Zalmout, Nasser and Li, Xian},
  title     = {Train a Unified Multimodal Data Quality Classifier with Synthetic Data},
  booktitle = {Findings of the Association for Computational Linguistics: {EMNLP} 2025, Suzhou, China, November 4-9, 2025},
  editor    = {Christodoulopoulos, Christos and Chakraborty, Tanmoy and Rose, Carolyn and Peng, Violet},
  pages     = {1972--1986},
  publisher = {Association for Computational Linguistics},
  year      = {2025},
  isbn      = {979-8-89176-335-7},
  url       = {https://aclanthology.org/2025.findings-emnlp.104/},
  researchr = {https://researchr.org/publication/WangLLLSLSYZL25},
  cites     = {0},
  citedby   = {0},
}