% TaskSum (Tang et al.) -- conference paper in the DASFAA 2022 proceedings (LNCS series).
% Maintenance notes:
%   - editor names use the "Last, First" form, so multi-word surnames need no braces;
%   - the DOI is stored bare (no LaTeX escaping of "_");
%   - language/address are written in English so the entry stays plain ASCII;
%   - {TaskSum} is braced in the title to survive sentence-casing styles.
@inproceedings{5c452b19732c47a7bc0e90a0035c25f7,
  author    = {Moming Tang and Dawei Cheng and Cen Chen and Yuqi Liang and Yifeng Luo and Weining Qian},
  title     = {{TaskSum}: Task-Driven Extractive Text Summarization for Long News Documents Based on Reinforcement Learning},
  booktitle = {Database Systems for Advanced Applications - 27th International Conference, DASFAA 2022, Proceedings},
  editor    = {Arnab Bhattacharya and Lee Mong Li, Janice and Divyakant Agrawal and Reddy, P. Krishna and Mukesh Mohania and Anirban Mondal and Vikram Goyal and Uday Kiran, Rage},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  year      = {2022},
  pages     = {306--313},
  doi       = {10.1007/978-3-031-00129-1_25},
  isbn      = {9783031001284},
  language  = {English},
  keywords  = {Extractive summarization, Reinforcement learning},
  note      = {Publisher Copyright: {\textcopyright} 2022, The Author(s), under exclusive license to Springer Nature Switzerland AG.; 27th International Conference on Database Systems for Advanced Applications, DASFAA 2022 ; Conference date: 11-04-2022 Through 14-04-2022},
  abstract  = {A popular and state-of-the-art family of extractive summarization is to explore pre-trained language models through reinforcement learning (RL). Despite gaining promising results, existing RL-based methods suffer from three drawbacks. First, they often adopt sparse reward signal schemes, which only give rewards to some of the extracted sentences, and result in neglecting salient sentences. Second, they often deem summarization as an independent task and neglect the latent connections existing between summarization and other downstream tasks, that could provide insightful hints to guide the upstream summarization task in return. Third, the length of input sequences in most summarization methods is restricted by the utilized pre-trained language models. To address these problems, we propose a novel RL-based Seq2Seq extractive summarization model, namely TaskSum, which combines extractive text summarization with multiple associated tasks via a dense reward signal scheme. Moreover, we implement a BERT-based hierarchical encoder to effectively encode documents of arbitrary length. Empirical results demonstrate that TaskSum can overcome the above-mentioned drawbacks of existing RL-based summarization methods and achieve significantly better results for long documents.},
}