Energon: Toward Efficient Acceleration of Transformers Using Dynamic Sparse Attention

Zhe Zhou, Junlin Liu, Zhenyu Gu, Guangyu Sun. Energon: Toward Efficient Acceleration of Transformers Using Dynamic Sparse Attention. IEEE Trans. on CAD of Integrated Circuits and Systems, 42(1):136-149, 2023. doi:10.1109/TCAD.2022.3170848

@comment{
  Journal article record for the Energon paper (volume 42, number 1, 2023).
  Author names are stored in the unambiguous Last, First form; a numeric
  homonym-disambiguation suffix that was attached to the last author has been
  dropped because BibTeX would otherwise parse it as the surname.
  The researchr, cites and citedby fields are not standard BibTeX fields;
  they are kept as bookkeeping metadata and are ignored by standard styles.
}
@article{ZhouLGS23,
  author    = {Zhou, Zhe and Liu, Junlin and Gu, Zhenyu and Sun, Guangyu},
  title     = {{Energon}: Toward Efficient Acceleration of Transformers Using Dynamic Sparse Attention},
  journal   = {{IEEE} Transactions on Computer-Aided Design of Integrated Circuits and Systems},
  volume    = {42},
  number    = {1},
  pages     = {136--149},
  year      = {2023},
  doi       = {10.1109/TCAD.2022.3170848},
  url       = {https://doi.org/10.1109/TCAD.2022.3170848},
  researchr = {https://researchr.org/publication/ZhouLGS23},
  cites     = {0},
  citedby   = {0},
}