@inproceedings{13ab029ffe7e4294b74919de418ca69c,
title = "Removing Input Confounder for Translation Quality Estimation via a Causal Motivated Method",
abstract = "Most state-of-the-art QE systems built upon neural networks have achieved promising performances on benchmark datasets. However, the performance of these methods can be easily influenced by the inherent features of the model input, such as the length of input sequence or the number of unseen tokens. In this paper, we introduce a causal inference based method to eliminate the negative impact caused by the characters of the input for a QE system. Specifically, we propose an iterative denoising framework for multiple confounding features. The confounder elimination operation at each iteration step is implemented by a Half-Sibling Regression based method. We conduct our experiments on the official datasets and submissions from WMT 2020 Quality Estimation Shared Task of Sentence-Level Direct Assessment. Experimental results show that the denoised QE results gain better Pearson{\textquoteright}s correlation scores with human assessments compared to the original submissions.",
keywords = "Causal inference, Machine translation, Quality estimation",
author = "Xuewen Shi and Heyan Huang and Ping Jian and Tang, {Yi Kun}",
note = "Publisher Copyright: {\textcopyright} 2021, Springer Nature Switzerland AG.; 5th International Joint Conference on Asia-Pacific Web and Web-Age Information Management, APWeb-WAIM 2021 ; Conference date: 23-08-2021 Through 25-08-2021",
year = "2021",
doi = "10.1007/978-3-030-85896-4_28",
language = "English",
isbn = "9783030858957",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "358--364",
editor = "U, {Leong Hou} and Marc Spaniol and Yasushi Sakurai and Junying Chen",
booktitle = "Web and Big Data - 5th International Joint Conference, APWeb-WAIM 2021, Proceedings",
address = "Germany",
}