@inproceedings{ea74f8db250e4ce29dea4bd75c250b1a,
title = "Adversarial Self-Attention for Language Understanding",
abstract = "Deep neural models (e.g. Transformer) naturally learn spurious features, which create a “shortcut” between the labels and inputs, thus impairing the generalization and robustness. This paper advances the self-attention mechanism to its robust variant for Transformer-based pre-trained language models (e.g. BERT). We propose Adversarial Self-Attention mechanism (ASA), which adversarially biases the attentions to effectively suppress the model reliance on features (e.g. specific keywords) and encourage its exploration of broader semantics. We conduct a comprehensive evaluation across a wide range of tasks for both pre-training and fine-tuning stages. For pre-training, ASA unfolds remarkable performance gains compared to naive training for longer steps. For fine-tuning, ASA-empowered models outweigh naive models by a large margin considering both generalization and robustness.",
author = "Hongqiu Wu and Ruixue Ding and Hai Zhao and Pengjun Xie and Fei Huang and Min Zhang",
note = "Publisher Copyright: Copyright {\textcopyright} 2023, Association for the Advancement of Artificial Intelligence (www.aaai.org). All rights reserved.; 37th AAAI Conference on Artificial Intelligence, AAAI 2023 ; Conference date: 07-02-2023 Through 14-02-2023",
year = "2023",
month = jun,
day = "27",
doi = "10.1609/aaai.v37i11.26608",
language = "英语",
series = "Proceedings of the 37th AAAI Conference on Artificial Intelligence, AAAI 2023",
publisher = "AAAI press",
pages = "13727--13735",
editor = "Brian Williams and Yiling Chen and Jennifer Neville",
booktitle = "AAAI-23 Technical Tracks 11",
}