@inproceedings{b216236e66a340a1931e0e3329cf0ccf,
title = "DBM: Delay-sensitive Buffering Mechanism for DNN Offloading Services",
abstract = "DNN offloading has become an important supporting technology for edge intelligence. However, most of the existing works do not consider thread scheduling, which can achieve the parallelism of multiple threads in the practical distributed DNN inference system. To address this issue, we discuss the thread scheduling of the computing units participating in offloading in this paper, considering a single-core Central Processing Unit (CPU) and the Round Robin Scheduling (RRS). We deduce the relationship between the blocking of DNN inference-related threads and the Average Task Delay (ATD) and prove that an appropriate buffer setting can reduce blocking times. Theoretical analysis verifies that the buffering mechanism (DBM) can reduce the ATD significantly, and experimental results demonstrate that the DBM-improved DNN offloading can achieve a delay reduction of 14\%-71\%.",
keywords = "DNN offloading, buffering mechanism, streaming tasks",
author = "Guoliang Gao and Liantao Wu and Yang Yang and Kai Li",
note = "Publisher Copyright: {\textcopyright} 2022 IEEE.; 27th Asia-Pacific Conference on Communications, APCC 2022 ; Conference date: 19-10-2022 Through 21-10-2022",
year = "2022",
doi = "10.1109/APCC55198.2022.9943625",
language = "英语",
series = "APCC 2022 - 27th Asia-Pacific Conference on Communications: Creating Innovative Communication Technologies for Post-Pandemic Era",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "421--426",
booktitle = "APCC 2022 - 27th Asia-Pacific Conference on Communications",
address = "美国",
}