Reproducing Whisper-Style Training Using An Open-Source Toolkit And Publicly Available Data

Yifan Peng, Jinchuan Tian, Brian Yan, Dan Berrebbi, Xuankai Chang, Xinjian Li, Jiatong Shi, Siddhant Arora, William Chen, Roshan S. Sharma, Wangyou Zhang, Yui Sudo, Muhammad Shakeel, Jee-weon Jung, Soumi Maiti, Shinji Watanabe. Reproducing Whisper-Style Training Using An Open-Source Toolkit And Publicly Available Data. In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2023, Taipei, Taiwan, December 16-20, 2023, pages 1-8. IEEE, 2023. doi:10.1109/ASRU57964.2023.10389676

@comment{
  PengTYBCLSACSZSSJMW23: conference paper in the ASRU 2023 proceedings.
  Authors are stored as "Last, First"; numeric homonym suffixes such as
  "0001" are not part of a name and must not appear in the author field.
  Braced words in title/booktitle keep their capitalisation under
  sentence-casing styles. The researchr, cites and citedby fields are
  non-standard and are ignored by bibliography styles.
}
@inproceedings{PengTYBCLSACSZSSJMW23,
  author    = {Peng, Yifan and Tian, Jinchuan and Yan, Brian and Berrebbi, Dan and Chang, Xuankai and Li, Xinjian and Shi, Jiatong and Arora, Siddhant and Chen, William and Sharma, Roshan S. and Zhang, Wangyou and Sudo, Yui and Shakeel, Muhammad and Jung, Jee-weon and Maiti, Soumi and Watanabe, Shinji},
  title     = {Reproducing {Whisper}-Style Training Using An Open-Source Toolkit And Publicly Available Data},
  booktitle = {{IEEE} Automatic Speech Recognition and Understanding Workshop, {ASRU} 2023, {Taipei}, {Taiwan}, December 16--20, 2023},
  pages     = {1--8},
  publisher = {IEEE},
  year      = {2023},
  doi       = {10.1109/ASRU57964.2023.10389676},
  url       = {https://doi.org/10.1109/ASRU57964.2023.10389676},
  isbn      = {979-8-3503-0689-7},
  researchr = {https://researchr.org/publication/PengTYBCLSACSZSSJMW23},
  cites     = {0},
  citedby   = {0},
}