@inproceedings{332ebd057fb143cabf22b9dc2151c3ca,
title = "Filter-GLAT: Filter Glanced Decoder Output for Non-autoregressive Transformer",
abstract = "Non-autoregressive machine translation model has achieved significantly faster inference speed compared to the autoregressive translation model. However, its translation quality is degraded compared to the autoregressive translation model. Despite numerous advanced methods are proposed to improve the translation quality of the non-autoregressive translation model, achieving the desired trade-off between quality and efficiency is difficult. In this paper, a Filter Glanced Transformer, named Filter-GLAT, is proposed to tackle this problem. It first refines the glance sampling learning strategy, followed by adopting the Filter learning strategy during training, substantially enhancing the translation quality. As for the inference speed, Filter-GLAT generates predictions with only a single decoding pass, maintaining high speed. Moreover, the Filter learning strategy helps the model narrow the gap between training and inference procedures by modifying the training process. Extensive experiments over translation benchmarks (WMT{\textquoteright}14 EN-DE and WMT{\textquoteright}16 EN-RO) demonstrate that Filter-GLAT almost strikes the best balance between translation quality and speed.",
keywords = "Efficient Inference, Learning Strategy, Neural Machine Translation, Non-autoregressive Generation",
author = "Zichun Wang and Huanran Zheng and Xiaoling Wang",
note = "Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd. 2024.; 8th Asia-Pacific Web and Web-Age Information Management Joint International Conference on Web and Big Data, APWeb-WAIM 2024 ; Conference date: 30-08-2024 Through 01-09-2024",
year = "2024",
doi = "10.1007/978-981-97-7232-2\_5",
language = "英语",
isbn = "9789819772315",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "59--73",
editor = "Wenjie Zhang and Zhengyi Yang and Xiaoyang Wang and Anthony Tung and Zhonglong Zheng and Hongjie Guo",
booktitle = "Web and Big Data - 8th International Joint Conference, APWeb-WAIM 2024, Proceedings",
address = "德国",
}