@inproceedings{beb034f637a74b8dbd03eb4596017e83,
title = "Uni-DlLoRA: Style Fine-Tuning for Fashion Image Translation",
abstract = "Image-to-image (i2i) translation has achieved notable success, yet remains challenging in scenarios like real-to-illustrative style transfer of fashion. Existing methods focus on enhancing the generative model with diversity while lacking ID-preserved domain translation. This paper introduces a novel model named Uni-DlLoRA to release this constraint. The proposed model combines the original images within a pretrained diffusion-based model using the proposed Uni-adapter extractors, while adopting the proposed Dual-LoRA module to provide distinct style guidance. This approach optimizes generative capabilities and reduces the number of additional parameters required. In addition, a new multimodal dataset featuring higher-quality images with captions built upon an existing real-to-illustration dataset is proposed. Experimentation validates the effectiveness of our proposed method.",
keywords = "denoising diffusion probabilistic models, fashion synthesis, image-to-image translation",
author = "Fangjian Liao and Xingxing Zou and Wong, \{Wai Keung\}",
note = "Publisher Copyright: {\textcopyright} 2024 Owner/Author.; 32nd ACM International Conference on Multimedia, MM 2024 ; Conference date: 28-10-2024 Through 01-11-2024",
year = "2024",
month = oct,
day = "28",
doi = "10.1145/3664647.3681459",
language = "English",
series = "MM 2024 - Proceedings of the 32nd ACM International Conference on Multimedia",
publisher = "Association for Computing Machinery, Inc",
pages = "6404--6413",
booktitle = "MM 2024 - Proceedings of the 32nd ACM International Conference on Multimedia",
}