SLM: Bridge the Thin Gap Between Speech and Text Foundation Models

Mingqiu Wang, Wei Han, Izhak Shafran, Zelin Wu, Chung-Cheng Chiu, Yuan Cao, Nanxin Chen, Yu Zhang, Hagen Soltau, Paul K. Rubenstein, Lukas Zilka, Dian Yu, Golan Pundak, Nikhil Siddhartha, Johan Schalkwyk, Yonghui Wu. SLM: Bridge the Thin Gap Between Speech and Text Foundation Models. In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2023, Taipei, Taiwan, December 16-20, 2023, pages 1-8. IEEE, 2023. doi:10.1109/ASRU57964.2023.10389703

% ASRU 2023 workshop paper. Author names are stored as "Last, First" without
% numeric homonym suffixes; acronyms are brace-protected; ranges use "--".
@inproceedings{WangHSWCCCZSRZYPSSW23,
  author    = {Wang, Mingqiu and Han, Wei and Shafran, Izhak and Wu, Zelin and Chiu, Chung-Cheng and Cao, Yuan and Chen, Nanxin and Zhang, Yu and Soltau, Hagen and Rubenstein, Paul K. and Zilka, Lukas and Yu, Dian and Pundak, Golan and Siddhartha, Nikhil and Schalkwyk, Johan and Wu, Yonghui},
  title     = {{SLM}: Bridge the Thin Gap Between Speech and Text Foundation Models},
  booktitle = {{IEEE} Automatic Speech Recognition and Understanding Workshop, {ASRU} 2023, Taipei, Taiwan, December 16--20, 2023},
  pages     = {1--8},
  publisher = {IEEE},
  year      = {2023},
  doi       = {10.1109/ASRU57964.2023.10389703},
  url       = {https://doi.org/10.1109/ASRU57964.2023.10389703},
  isbn      = {979-8-3503-0689-7},
  researchr = {https://researchr.org/publication/WangHSWCCCZSRZYPSSW23},
  cites     = {0},
  citedby   = {0},
}