% Conference paper: ITVTON (Ni and Xu), in the PRCV 2025 proceedings, Lecture Notes in Computer Science.
% Normalised from an automated export: bare DOI, English language/address values,
% "Last, First" names, and brace-protected acronyms. The address field carries the
% publisher country as given by the export; the publisher city is not recorded here.
@inproceedings{1e1951d2aafa42f4a5e33d7c77dee510,
  author    = {Ni, Haifeng and Xu, Ming},
  title     = {{ITVTON}: Virtual Try-On Diffusion Transformer Based on Integrated Image and Text},
  booktitle = {Pattern Recognition and Computer Vision - 8th Chinese Conference, {PRCV} 2025, Proceedings},
  editor    = {Kittler, Josef and Xiong, Hongkai and Yang, Jian and Chen, Xilin and Lu, Jiwen and Lin, Weiyao and Yu, Jingyi and Zheng, Weishi},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  year      = {2026},
  pages     = {460--474},
  isbn      = {9789819556786},
  doi       = {10.1007/978-981-95-5679-3_32},
  language  = {English},
  keywords  = {diffusion transformer, parameter training, virtual try-on},
  abstract  = {Virtual try-on, which aims to seamlessly fit garments onto person images, has recently seen significant progress with diffusion-based models. However, existing methods commonly resort to duplicated backbones or additional image encoders to extract garment features, which increases computational overhead and network complexity. In this paper, we propose ITVTON, an efficient framework that leverages the Diffusion Transformer (DiT) as its single generator to improve image fidelity. By concatenating garment and person images along the width dimension and incorporating textual descriptions from both, ITVTON effectively captures garment-person interactions while preserving realism. To further reduce computational cost, we restrict training to the attention parameters within a single Diffusion Transformer (Single-DiT) block. Extensive experiments demonstrate that ITVTON surpasses baseline methods both qualitatively and quantitatively, setting a new standard for virtual try-on. Moreover, experiments on 10,257 image pairs from IGPair confirm its robustness in real-world scenarios.},
  note      = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd. 2026.; 8th Chinese Conference on Pattern Recognition and Computer Vision, PRCV 2025 ; Conference date: 15-10-2025 Through 18-10-2025},
}