Rongzhi Zhang, Jiaming Shen, Tianqi Liu, Haorui Wang, Zhen Qin, Feng Han, Jialu Liu, Simon Baumgartner, Michael Bendersky, Chao Zhang. PLaD: Preference-based Large Language Model Distillation with Pseudo-Preference Pairs. In Lun-Wei Ku, Andre Martins, Vivek Srikumar, editors, Findings of the Association for Computational Linguistics, ACL 2024, Bangkok, Thailand and virtual meeting, August 11-16, 2024, pages 15623-15636. Association for Computational Linguistics, 2024. [doi]
% Conference paper (Findings of ACL 2024). Names are stored as "Last, First";
% numeric disambiguation suffixes such as "0001" are omitted from author names
% because BibTeX would otherwise parse the number as the surname.
@inproceedings{ZhangS0W0HLBBZ24,
  author     = {Zhang, Rongzhi and Shen, Jiaming and Liu, Tianqi and Wang, Haorui and Qin, Zhen and Han, Feng and Liu, Jialu and Baumgartner, Simon and Bendersky, Michael and Zhang, Chao},
  title      = {{PLaD}: Preference-based Large Language Model Distillation with Pseudo-Preference Pairs},
  booktitle  = {Findings of the Association for Computational Linguistics, {ACL} 2024, Bangkok, Thailand and virtual meeting, August 11--16, 2024},
  editor     = {Ku, Lun-Wei and Martins, Andre and Srikumar, Vivek},
  pages      = {15623--15636},
  publisher  = {Association for Computational Linguistics},
  year       = {2024},
  isbn       = {979-8-89176-099-8},
  url        = {https://aclanthology.org/2024.findings-acl.923},
  researchr  = {https://researchr.org/publication/ZhangS0W0HLBBZ24},
  cites      = {0},
  citedby    = {0},
}