% Conference paper: "ScriptNet" (ICONIP 2022 proceedings, Springer CCIS series).
% Record originates from an automated portal export; the citation key is the
% exporter's opaque identifier and is kept as-is so existing \cite commands work.
% NOTE(review): `address` carries the publisher country from the export, not a
% city -- confirm the publisher location against the printed volume.
@inproceedings{cb2ecd84c4d7486f95dd3d0db0f89c4d,
  author    = {Deng, Minzhen and Ma, Hui and Liu, Li and Qiu, Taorong and Lu, Yue and Suen, Ching Y.},
  title     = {{ScriptNet}: A Two Stream {CNN} for Script Identification in Camera-Based Document Images},
  booktitle = {Neural Information Processing - 29th International Conference, {ICONIP} 2022, Proceedings},
  editor    = {Tanveer, Mohammad and Agarwal, Sonali and Ozawa, Seiichi and Ekbal, Asif and Jatowt, Adam},
  series    = {Communications in Computer and Information Science},
  publisher = {{Springer Science and Business Media Deutschland GmbH}},
  address   = {Germany},
  year      = {2023},
  pages     = {14--25},
  doi       = {10.1007/978-981-99-1645-0_2},
  isbn      = {9789819916443},
  language  = {English},
  keywords  = {Script identification, ScriptNet, camera-based document images, spatial stream, visual stream},
  abstract  = {Script identification is an essential part of a document image analysis system, since documents written in different scripts may undergo different processing methods. In this paper, we address the issue of script identification in camera-based document images, which is challenging since the camera-based document images are often subject to perspective distortions, uneven illuminations, etc. We propose a novel network called ScriptNet that is composed of two streams: spatial stream and visual stream. The spatial stream captures the spatial dependencies within the image, while the visual stream describes the appearance of the image. The two streams are then fused in the network, which can be trained in an end-to-end manner. Extensive experiments demonstrate the effectiveness of the proposed approach. The two streams have been shown to be complementary to each other. An accuracy of 99.1 \% has been achieved by our proposed network, which compares favourably with state-of-the-art methods. Besides, the proposed network achieves promising results even when it is trained with non-camera-based document images and tested on camera-based document images.},
  note      = {Publisher Copyright: {\textcopyright} 2023, The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd.; 29th International Conference on Neural Information Processing, ICONIP 2022 ; Conference date: 22-11-2022 Through 26-11-2022},
}