@inproceedings{1e7e2b09dcbf42e5a384a6e769f88e0b,
title = "Domain-specific modelware: To make the machine learning model reusable and reproducible",
abstract = "Machine learning task is a routine process including data collection, feature engineering, model training, hyper-parameters tuning, model evaluation and model deployment. The process is usually complex, iterated and time-consuming. Commonly, researchers seldom start building the machine model from scratch. They may select some well-known and well-trained models in similar task domains as the reference models. Then they try to tune the hyper-parameters and accelerate the iteration. Thus, some models are often reused and need to be reproduced by using new training dataset. Moreover, understanding the model and the iteration is more necessary. This scenario is very similar to that of software reuse. In this poster, we propose Modelware and argue the need of Modelware to make the machine learning model reusable and reproducible. We define the Modelware which is the reused object and develop a model repository to provide the model lineage management and model visit tool. The big data for building model is managed collaboratively so that the model can be reproduced. The iteration process to obtain the final optimized model is abstracted and implemented using a lightweight workflow. Finally, we take two different classification tasks as the demonstration.",
keywords = "Machine learning, Model repository, Model specification, Modelware, Reproduce, Reuse",
author = "Hui Zhao and Jimin Liang and Xuezhen Yin and Lingfeng Yang and Peili Yang and Yuhang Wang",
note = "Publisher Copyright: {\textcopyright} 2018 ACM.; 12th ACM/IEEE International Symposium on Empirical Software Engineering and Measurement, ESEM 2018 ; Conference date: 11-10-2018 Through 12-10-2018",
year = "2018",
month = oct,
day = "11",
doi = "10.1145/3239235.3267439",
language = "英语",
series = "International Symposium on Empirical Software Engineering and Measurement",
publisher = "IEEE Computer Society",
booktitle = "Proceedings of the 12th ACM/IEEE International Symposium on Empirical Software Engineering and Measurement, ESEM 2018",
address = "美国",
}