@inproceedings{f0a488b080034e429765574530ff5ce3,
title = "Global Meets Local: Effective Multi-Label Image Classification via Category-Aware Weak Supervision",
abstract = "Multi-label image classification, which can be categorized into label-dependency and region-based methods, is a challenging problem due to the complex underlying object layouts. Although region-based methods are less likely to encounter issues with model generalizability than label-dependency methods, they often generate hundreds of meaningless or noisy proposals with non-discriminative information, and the contextual dependency among the localized regions is often ignored or over-simplified. This paper builds a unified framework to perform effective noisy-proposal suppression and to interact between global and local features for robust feature learning. Specifically, we propose category-Aware weak supervision to concentrate on non-existent categories so as to provide deterministic information for local feature learning, restricting the local branch to focus on more high-quality regions of interest. Moreover, we develop a cross-granularity attention module to explore the complementary information between global and local features, which can build the high-order feature correlation containing not only global-To-local, but also local-To-local relations. Both advantages guarantee a boost in the performance of the whole network. Extensive experiments on two large-scale datasets (MS-COCO and VOC 2007) demonstrate that our framework achieves superior performance over state-of-The-Art methods.",
keywords = "image recognition, multi-label classification, region proposal, self-Attention, weak supervision",
author = "Jiawei Zhan and Jun Liu and Wei Tang and Guannan Jiang and Xi Wang and Gao, \{Bin Bin\} and Tianliang Zhang and Wenlong Wu and Wei Zhang and Chengjie Wang and Yuan Xie",
note = "Publisher Copyright: {\textcopyright} 2022 ACM.; 30th ACM International Conference on Multimedia, MM 2022 ; Conference date: 10-10-2022 Through 14-10-2022",
year = "2022",
month = oct,
day = "10",
doi = "10.1145/3503161.3547834",
language = "英语",
series = "MM 2022 - Proceedings of the 30th ACM International Conference on Multimedia",
publisher = "Association for Computing Machinery, Inc",
pages = "6318--6326",
booktitle = "MM 2022 - Proceedings of the 30th ACM International Conference on Multimedia",
}