@inproceedings{1ab817e673414c6db51074fa4b2ff2bc,
title = "A hybrid model with pre-trained entity-aware transformer for relation extraction",
abstract = "Distantly supervised relation extraction is an efficient method to extract novel relational facts from unstructed text. Most previous neural methods adopt Convolutional Neural Network (CNN) or Recurrent Neural Network (RNN) to encode sentences. However, CNN is difficult to learn long-range dependencies and the parallelization of training RNN is precluded by its sequential nature. In this paper, we propose a novel hybrid model that combines Piece-wise Convolutional Neural Network (PCNN) and Entity-Aware Transformer to extract local features and learn the dependencies between distant positions jointly. The entity-aware Transformer is able to take semantic and syntax information under consideration and acquire entity-specific representations. The inner-sentence attention mechanism is then used over Transformer to alleviate the noise caused by irrelevant words. We concatenate outputs of PCNN and Transformer with word embeddings of entity mentions and then send them to the classifier, which can boost the performance of our model further. A transfer learning based strategy is applied, where the entity-aware Transformer is initialized with a priori knowledge learned from the related task of entity typing to improve the robustness of our model. The experimental results on a large-scale benchmark dataset show that our hybrid model with the pre-training strategy gets AUC score of 0.432 and outperforms the state-of-the-art baselines.",
keywords = "Relation extraction, Transfer learning, Transformer",
author = "Jinxin Yao and Min Zhang and Biyang Wang and Xianda Xu",
note = "Publisher Copyright: {\textcopyright} Springer Nature Switzerland AG 2020.; 13th International Conference on Knowledge Science, Engineering and Management, KSEM 2020 ; Conference date: 28-08-2020 Through 30-08-2020",
year = "2020",
doi = "10.1007/978-3-030-55130-8\_13",
language = "英语",
isbn = "9783030551292",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer",
pages = "148--160",
editor = "Gang Li and Shen, \{Heng Tao\} and Ye Yuan and Xiaoyang Wang and Huawen Liu and Xiang Zhao",
booktitle = "Knowledge Science, Engineering and Management - 13th International Conference, KSEM 2020, Proceedings, Part 1",
address = "德国",
}