% Conference paper from HPCC/SmartCity/DSS 2016 (held 12-14 Dec 2016).
% The year/month/day fields carry the proceedings publication date (20 Jan 2017),
% while the conference dates are recorded in the note field.
@inproceedings{4c5fd4d8a78b44cd824b4986fd978634,
  author    = {Zhou, Jun and Yu, Han and Xie, Cheng and Cai, Hongming and Jiang, Lihong},
  title     = {{IRMP}: From printed forms to relational data model},
  booktitle = {Proceedings - 18th IEEE International Conference on High Performance Computing and Communications, 14th IEEE International Conference on Smart City and 2nd IEEE International Conference on Data Science and Systems, HPCC/SmartCity/DSS 2016},
  editor    = {Yang, Laurence T. and Chen, Jinjun},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  pages     = {1394--1401},
  year      = {2017},
  month     = jan,
  day       = {20},
  doi       = {10.1109/HPCC-SmartCity-DSS.2016.0199},
  language  = {English},
  keywords  = {Data extraction, Form recognition, Model connection, Relational data model},
  abstract  = {Massive printed forms are inevitably existing in daily business processes, which makes it difficult for computers to deal with. Thus, there is an emerging requirement to automatically convert these print-outs into computer understandable data, stored as structured data models for further applications. To cater to this need, we first extract table lines and texts from printed forms and convert them into RDF models. Then the heterogeneous models extracted from different instances are connected based on string and lexical similarity. Finally according to the mapping rules we automatically convert the connected models into the relational data model, which builds the foundation for subsequent use such as database generation and linked data interconnection. Multiple experiments using real resumes as dataset as well as a case study are conducted to verify the framework. And we construct a prototype system, iRMP(intelligent Resource Management Platform), to demonstrate the practicability and effectiveness of the approach.},
  note      = {Publisher Copyright: {\textcopyright} 2016 IEEE.; 18th IEEE International Conference on High Performance Computing and Communications, 14th IEEE International Conference on Smart City and 2nd IEEE International Conference on Data Science and Systems, HPCC/SmartCity/DSS 2016 ; Conference date: 12-12-2016 Through 14-12-2016},
}