@inproceedings{32a00cf8d7144097907781c9d1b910d8,
title = "Incorporating Typological Features into Language Selection for Multilingual Neural Machine Translation",
abstract = "In this paper, we propose to use rich semantic and typological information of languages to improve the language selection method for multilingual NMT. In particular, we first use a graph-based model to output the most semantic similarity languages; then, a random forest model is built which integrates features such as data size, language family, word formation, morpheme overlap, word order, POS tag and syntax similarity together to predict the final target language(s). Experimental results on several datasets show that our method achieves consistent improvements over existing approaches both on language selection and multilingual NMT.",
keywords = "Language selection, Neural machine translation, Typological feature",
author = "Chenggang Mi and Shaolin Zhu and Yi Fan and Lei Xie",
note = "Publisher Copyright: {\textcopyright} 2021, Springer Nature Switzerland AG.; 5th International Joint Conference on Asia-Pacific Web and Web-Age Information Management, APWeb-WAIM 2021 ; Conference date: 23-08-2021 Through 25-08-2021",
year = "2021",
doi = "10.1007/978-3-030-85896-4_27",
language = "英语",
isbn = "9783030858957",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "348--357",
editor = "U, {Leong Hou} and Marc Spaniol and Yasushi Sakurai and Junying Chen",
booktitle = "Web and Big Data - 5th International Joint Conference, APWeb-WAIM 2021, Proceedings",
}