@inproceedings{1611c7e5d99d4f3b9715180f8187590a,
title = "Chimera Model of Candidate Soups for Non-Autoregressive Translation",
abstract = "Non-Autoregressive Translation (NAT) models have drawn much attention because of their excellent decoding speed. However, NAT models suffer a significant drop in translation quality compared to Autoregressive Translation (AT) models. Candidate Soups (CandiSoups) is an effective method that can fully use the different candidate translations, significantly improving the translation quality for NAT models. However, it needs to use an additional AT model for re-scoring to achieve the best performance, which slows down its inference speed and takes up more computing resources. In this paper, we propose a Chimera Model framework of CandiSoups (CMCS), which can significantly accelerate inference speed while maintaining superior performance for CandiSoups. Specifically, by modifying the decoder, we fuse the AT and NAT models to construct a Chimera Model that can perform self-rescore. Moreover, we propose a novel adaptive training method to help train Chimera Models better. Experimental results on two major benchmarks demonstrate the effectiveness of our proposed approach, which can significantly improve translation quality while maintaining the excellent inference speed.",
keywords = "Efficient Inference, Language Processing, Machine Translation, Non-autoregressive Generation",
author = "Huanran Zheng and Wei Zhu and Xiaoling Wang",
note = "Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd. 2025.; 29th International Conference on Database Systems for Advanced Applications, DASFAA 2024 ; Conference date: 02-07-2024 Through 05-07-2024",
year = "2025",
doi = "10.1007/978-981-97-5779-4\_28",
language = "英语",
isbn = "9789819757787",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "416--425",
editor = "Makoto Onizuka and Jae-Gil Lee and Yongxin Tong and Chuan Xiao and Yoshiharu Ishikawa and Kejing Lu and Sihem Amer-Yahia and H.V. Jagadish",
booktitle = "Database Systems for Advanced Applications - 29th International Conference, DASFAA 2024, Proceedings",
address = "德国",
}