@inproceedings{5a274b961bbe4ce1828488861adb8cb7,
title = "Clustering with Entropy-based Recombination for Training GCNs on Large Graphs",
abstract = "With the development of deep learning methods on non-grid graph data, Graph Convolutional Networks (GCNs) are playing important roles in a wide range of scenarios. When dealing with graphs with ever-growing sizes, even if the compute capability of one GPU card is sufficient, its limited memory capacity would make the training on large graphs infeasible. Sampling methods on three levels (i.e., node-level, layer-level, and subgraph-level) have been proposed to improve the scalability of GCNs. However, there still exist drawbacks in sampling-based approaches including time-consuming sampling processes and biased node representations. To tackle these issues, we propose a novel subgraph-based sampling method considering the generalized distance of label distribution between each subgraph and the whole graph. Specifically, our method introduces two pre-steps before training: (1) partitioning all the nodes in the original graph into different clusters through an efficient clustering algorithm; (2) combining the clusters obtained in the first step into a set of bigger groups (subgraphs) based on the information entropy theory. Experiments show that our work could reserve similar label distribution to that on the whole graph and outperform SOTA models in terms of classification accuracy on different datasets. Besides, the time cost of our pre-processing procedure is acceptable compared with the time spent in training.",
keywords = "graph clustering, graph convolutional networks, label entropy, recombination",
author = "Shangwei Wu and Yingtong Xiong and Hui Liang and Chuliang Weng",
note = "Publisher Copyright: {\textcopyright} 2023 IEEE.; 23rd IEEE International Conference on Data Mining Workshops, ICDMW 2023 ; Conference date: 01-12-2023 Through 04-12-2023",
year = "2023",
doi = "10.1109/ICDMW60847.2023.00153",
language = "英语",
series = "IEEE International Conference on Data Mining Workshops, ICDMW",
publisher = "IEEE Computer Society",
pages = "1170--1177",
editor = "Jihe Wang and Yi He and Dinh, \{Thang N.\} and Christan Grant and Meikang Qiu and Witold Pedrycz",
booktitle = "Proceedings - 23rd IEEE International Conference on Data Mining Workshops, ICDMW 2023",
address = "美国",
}