% RealFormer paper, Findings of ACL-IJCNLP 2021 (ACL Anthology ID 2021.findings-acl.81).
% The url field uses the canonical Anthology address, not a preview-branch build.
@inproceedings{he-etal-2021-realformer,
  author    = {He, Ruining and
               Ravula, Anirudh and
               Kanagal, Bhargav and
               Ainslie, Joshua},
  title     = {{RealFormer}: Transformer Likes Residual Attention},
  editor    = {Zong, Chengqing and
               Xia, Fei and
               Li, Wenjie and
               Navigli, Roberto},
  booktitle = {Findings of the Association for Computational Linguistics: {ACL-IJCNLP} 2021},
  month     = aug,
  year      = {2021},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  pages     = {929--943},
  doi       = {10.18653/v1/2021.findings-acl.81},
  url       = {https://aclanthology.org/2021.findings-acl.81/},
}
Markdown (Informal)
[RealFormer: Transformer Likes Residual Attention](https://aclanthology.org/2021.findings-acl.81/) (He et al., Findings 2021)
ACL
- Ruining He, Anirudh Ravula, Bhargav Kanagal, and Joshua Ainslie. 2021. RealFormer: Transformer Likes Residual Attention. In Findings of the Association for Computational Linguistics: ACL-IJCNLP 2021, pages 929–943, Online. Association for Computational Linguistics.