@inproceedings{3a56339b61f743039f1acc46c8b31f91,
title = "Alternating language modeling for cross-lingual pre-training",
abstract = "Language model pre-training has achieved success in many natural language processing tasks. Existing methods for cross-lingual pre-training adopt Translation Language Model to predict masked words with the concatenation of the source sentence and its target equivalent. In this work, we introduce a novel cross-lingual pre-training method, called Alternating Language Modeling (ALM). It code-switches sentences of different languages rather than simple concatenation, hoping to capture the rich cross-lingual context of words and phrases. More specifically, we randomly substitute source phrases with target translations to create code-switched sentences. Then, we use these code-switched data to train ALM model to learn to predict words of different languages. We evaluate our pre-training ALM on the downstream tasks of machine translation and cross-lingual classification. Experiments show that ALM can outperform the previous pretraining methods on three benchmarks.",
author = "Jian Yang and Shuming Ma and Dongdong Zhang and Wu, \{Shuang Zhi\} and Zhoujun Li and Ming Zhou",
note = "Publisher Copyright: Copyright {\textcopyright} 2020 Association for the Advancement of Artificial Intelligence. All rights reserved.; 34th AAAI Conference on Artificial Intelligence, AAAI 2020 ; Conference date: 07-02-2020 Through 12-02-2020",
year = "2020",
language = "英语",
series = "AAAI 2020 - 34th AAAI Conference on Artificial Intelligence",
publisher = "AAAI press",
pages = "9386--9393",
booktitle = "AAAI 2020 - 34th AAAI Conference on Artificial Intelligence",
}