@inproceedings{3413f53742cf4994a2ad2cc55701b36e,
title = "LD-BFR: Vector-Quantization-Based Face Restoration Model with Latent Diffusion Enhancement",
abstract = "Blind Face Restoration (BFR) aims to restore high-quality face images from low-quality images with unknown degradation. Previous GAN-based or ViT-based methods have shown promising results, but have identity details loss once degradation is severe; while recent diffusion-based methods work on image level and take a lot of time to infer. To restore images in any degradation types with high quality and spend less time compared to the classic diffusion-based method, we propose LD-BFR, a novel BFR framework that integrates both the strengths of vector quantization and latent diffusion. First, we employ a Dual Cross-Attention vector quantization to restore the degraded image in a global manner. Then we utilize the restored high-quality quantized feature as the guidance in our latent diffusion model to generate high-quality restored images with rich details. With the help of the proposed high-quality feature injection module, our LD-BFR effectively injects the high-quality feature as a condition to guide the generation of our latent diffusion model. Extensive experiments demonstrate the superior performance of our model over the SOTA BFR methods. The code is available at: https://github.com/YuzhenD/LD-BFR.git.",
keywords = "blind face restoration, diffusion, vector-quantization",
author = "Yuzhen Du and Teng Hu and Ran Yi and Lizhuang Ma",
note = "Publisher Copyright: {\textcopyright} 2024 ACM.; 32nd ACM International Conference on Multimedia, MM 2024 ; Conference date: 28-10-2024 Through 01-11-2024",
year = "2024",
month = oct,
day = "28",
doi = "10.1145/3664647.3680853",
language = "英语",
series = "MM 2024 - Proceedings of the 32nd ACM International Conference on Multimedia",
publisher = "Association for Computing Machinery, Inc",
pages = "2852--2860",
booktitle = "MM 2024 - Proceedings of the 32nd ACM International Conference on Multimedia",
}