% Ma et al., "Mega: Moving Average Equipped Gated Attention", ICLR 2023.
% The url field points to the arXiv abstract page for this paper.
@inproceedings{ma23iclr,
  author    = {Ma, Xuezhe and Zhou, Chunting and Kong, Xiang and He, Junxian and Gui, Liangke and Neubig, Graham and May, Jonathan and Zettlemoyer, Luke},
  title     = {{Mega}: Moving Average Equipped Gated Attention},
  booktitle = {International Conference on Learning Representations ({ICLR})},
  address   = {Kigali, Rwanda},
  month     = may,
  year      = {2023},
  url       = {https://arxiv.org/abs/2209.10655},
}