@inproceedings{958076134143456d9cc527ba154bf049,
title = "EDSL: An Encoder-Decoder Architecture with Symbol-Level Features for Printed Mathematical Expression Recognition",
abstract = "Printed mathematical expression recognition (PMER) aims to transcribe a printed mathematical expression image into a structural expression. The task is useful in a wide spectrum of applications, including personalized question recommendation and automatic problem solving. In this paper, we propose a new method named EDSL, shorted for an Encoder-Decoder architecture with Symbol-Level features, to recognize printed mathematical expressions from input images. Its encoder consists of a segmentation module to identify all symbols and their spatial information from the image in an unsupervised manner, and a reconstruction module to recover symbol dependencies after symbol segmentation. Furthermore, we employ a position correction attention mechanism to capture the spatial relationship between symbols, and apply a transformer model to alleviate the negative impact from long output. We conduct extensive experiments on two real datasets to verify the effectiveness and rationality of our proposed EDSL model. The experimental results illustrated that EDSL outperformed state-of-the-art methods by an accuracy margin of 3.47 \% and 4.04 \% in the two datasets, respectively.",
keywords = "encoder-decoder network, position correction attention, printed mathematical expression recognition, segmentation",
author = "Yingnan Fu and Tingting Liu and Ming Gao and Aoying Zhou",
note = "Publisher Copyright: {\textcopyright} 2023, The Author(s), under exclusive license to Springer Nature Switzerland AG.; 17th International Conference on Document Analysis and Recognition, ICDAR 2023 ; Conference date: 21-08-2023 Through 26-08-2023",
year = "2023",
doi = "10.1007/978-3-031-41676-7\_8",
language = "英语",
isbn = "9783031416750",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "134--151",
editor = "Fink, \{Gernot A.\} and Rajiv Jain and Koichi Kise and Richard Zanibbi",
booktitle = "Document Analysis and Recognition – ICDAR 2023 - 17th International Conference, Proceedings",
address = "德国",
}