% Conference paper "StreamRec" in the DASFAA 2024 proceedings (pages 480--483).
% The citation key is the exporter-generated identifier and is kept as-is so
% existing \cite commands continue to resolve.
% Cleanup applied to the exported record:
%   - names are in "Last, First" form, with the editor initials "H. V." separated;
%   - case-sensitive words in title/booktitle are brace-protected;
%   - publisher has an extra brace pair so its literal " and " is not read as a
%     list separator;
%   - doi is stored bare (no LaTeX escaping of the underscore);
%   - language/address were localized (non-ASCII) export strings, now in English;
%   - series is reduced to the canonical series name.
% NOTE(review): address still holds the publisher's country as exported; BibTeX
% expects the publisher's city -- confirm the city and replace.
% NOTE(review): the LNCS volume number is not present in the exported record;
% add a volume field once confirmed.
@inproceedings{def62d7396fe461ca8414a3d40f5b9ad,
  author    = {Niu, Yuean and Xu, Zhizhen and Sun, Yushu and Xu, Chen},
  title     = {{StreamRec}: A Recommendation Inference System with {CUDA} Stream Acceleration},
  booktitle = {Database Systems for Advanced Applications - 29th International Conference, {DASFAA} 2024, Proceedings},
  editor    = {Onizuka, Makoto and Lee, Jae-Gil and Tong, Yongxin and Xiao, Chuan and Ishikawa, Yoshiharu and Lu, Kejing and Amer-Yahia, Sihem and Jagadish, H. V.},
  series    = {Lecture Notes in Computer Science},
  publisher = {{Springer Science and Business Media Deutschland GmbH}},
  address   = {Germany},
  year      = {2024},
  pages     = {480--483},
  doi       = {10.1007/978-981-97-5575-2_43},
  isbn      = {9789819755745},
  language  = {English},
  keywords  = {CUDA stream, Recommendation, Visualization},
  abstract  = {Deep learning based recommendation models are widely used in various applications. There are often dozens of groups of sparse features in the input of the recommendation model, and each group of features computes the embedding layer independently and applies a separate feature interaction. However, current deep learning frameworks sequentially schedule the execution of all operators into a single CUDA computational stream. Therefore, we propose StreamRec, a stream-based parallel inference system. It assigns the processing of individual features to different CUDA streams for parallel execution. Besides, StreamRec is able to visualize the execution performance and operators assignment results on the web.},
  note      = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd. 2024.; 29th International Conference on Database Systems for Advanced Applications, DASFAA 2024 ; Conference date: 02-07-2024 Through 05-07-2024},
}