% FiTGAN conference paper, published in the ICASSP 2025 proceedings (IEEE).
@inproceedings{241c35190e5546e7805ffa84255908fa,
  author    = {Zhou, Yingbo and Zhang, Pengyu and Ye, Yutong and Yue, Zhihao and Wei, Xian and Chen, Mingsong},
  title     = {{FiTGAN}: Content Fusion with Style Transformation for Few-shot Image Generation},
  booktitle = {2025 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2025 - Proceedings},
  editor    = {Rao, Bhaskar D. and Trancoso, Isabel and Sharma, Gaurav and Mehta, Neelesh B.},
  series    = {ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2025},
  doi       = {10.1109/ICASSP49660.2025.10888773},
  language  = {English},
  keywords  = {Content Fusion, Few-shot Image Generation, Generative Adversarial Network, Style Transformation},
  abstract  = {Due to the semantic entanglement in fusion strategies or unstable training in complicated image transformations, existing few-shot image generation methods still suffer from low generation quality and diversity. To tackle the above problems, we propose a novel fusion- and transformation-based framework named content Fusion with style Transformation Generative Adversarial Network (FiTGAN) for few-shot image generation. The basic assumption is that any image consists of a collection of content-related and style-related features. FiTGAN disentangles internal representations with two independent encoders and combines the fused contents and transformed styles to generate new images. Specifically, we design a multi-scale content fusion strategy and a reparameterized style transformation mechanism to learn more fine-grained semantics without changing category-relevant attributes. Furthermore, we formulate a content reconstruction loss and a style divergence loss to provide better training stability and generation performance. Comprehensive experiments on three well-known datasets demonstrate that FiTGAN can not only produce more realistic and diverse images for few-shot image generation but also achieve better classification accuracy for downstream visual applications with limited data.},
  note      = {Publisher Copyright: {\textcopyright} 2025 IEEE.; 2025 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2025 ; Conference date: 06-04-2025 Through 11-04-2025},
}