PVT v2: Improved baselines with Pyramid Vision Transformer

Wenhai Wang, Enze Xie, Xiang Li, Deng-Ping Fan, Kaitao Song, Ding Liang, Tong Lu, Ping Luo, Ling Shao. PVT v2: Improved baselines with Pyramid Vision Transformer. Computational Visual Media, 8(3):415-424, 2022. https://doi.org/10.1007/s41095-022-0274-8

% Journal article: PVT v2 (Computational Visual Media, vol. 8, no. 3, 2022).
% Cleanup notes:
%   - author names are in "Last, First" form; the numeric suffixes the export
%     attached to three names ("0028", "0002", "0001" -- presumably database
%     homonym IDs) were dropped because BibTeX would parse them as surnames.
%   - the acronym and the model name in the title are brace-protected so that
%     sentence-casing styles keep their capitals.
%   - researchr / cites / citedby are non-standard fields kept from the
%     export; standard styles ignore them.
@article{WangXLFSLLLS22,
  author    = {Wang, Wenhai and Xie, Enze and Li, Xiang and Fan, Deng-Ping and Song, Kaitao and Liang, Ding and Lu, Tong and Luo, Ping and Shao, Ling},
  title     = {{PVT} v2: Improved baselines with {Pyramid Vision Transformer}},
  journal   = {Computational Visual Media},
  volume    = {8},
  number    = {3},
  pages     = {415--424},
  year      = {2022},
  doi       = {10.1007/s41095-022-0274-8},
  url       = {https://doi.org/10.1007/s41095-022-0274-8},
  researchr = {https://researchr.org/publication/WangXLFSLLLS22},
  cites     = {0},
  citedby   = {0},
}