% Conference paper "OnMKD" (Deng, Li, Zhang, He), pp. 719--731 of the NLPCC 2023 proceedings.
% Names use the "Last, First" form; the DOI is stored bare (no LaTeX escaping).
% NOTE(review): address holds a country, not the publisher's city -- confirm the city and replace.
% NOTE(review): no series volume number is recorded here -- add a volume field once verified.
@inproceedings{ce0b585d7890407582039c4f35323e33,
  author    = {Deng, Jiali and Li, Dongyang and Zhang, Taolin and He, Xiaofeng},
  title     = {{OnMKD}: An Online Mutual Knowledge Distillation Framework for Passage Retrieval},
  booktitle = {Natural Language Processing and Chinese Computing - 12th National {CCF} Conference, {NLPCC} 2023, Proceedings},
  editor    = {Liu, Fei and Duan, Nan and Xu, Qingting and Hong, Yu},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  year      = {2023},
  pages     = {719--731},
  doi       = {10.1007/978-3-031-44696-2_56},
  isbn      = {9783031446955},
  language  = {English},
  keywords  = {Cross-wise contrastive learning, Mutual learning, Online knowledge distillation, Passage retrieval},
  abstract  = {Dense passage retriever recalls a set of relevant passages from a large corpus according to a natural language question. The dual-encoder architecture is prevalent in dense passage retrievers, which is based on large-scale pre-trained language models (PLMs). However, existing PLMs usually have thick structures and bulky parameters, resulting in large memory and time consumption. To overcome the limitation of PLMs, in this paper we apply online distillation to passage retrieval and propose an Online Mutual Knowledge Distillation framework (OnMKD). Specifically, we obtain a lightweight retriever by simultaneously updating two peer networks with the same dual-encoder structure and different initial parameters, named Online Mutual Knowledge Refinement. To further interact with the latent knowledge of intermediate layers, we utilize a novel cross-wise contrastive loss to alternate the representation of questions and passages. Experimental results indicate that our framework outperforms other small baselines with the same number of layers on multiple QA benchmarks. Compared to the heavy PLMs, OnMKD significantly accelerates the inference process and reduces storage requirements with only a slight sacrifice in performance.},
  note      = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2023.; 12th National CCF Conference on Natural Language Processing and Chinese Computing, NLPCC 2023 ; Conference date: 12-10-2023 Through 15-10-2023},
}