% Conference paper in the MMM 2023 proceedings (Lecture Notes in Computer Science).
% Cleaned from a repository export: name-grouping braces and the DOI are no longer
% LaTeX-escaped, and every person name uses the unambiguous "Last, First" form.
% NOTE(review): address holds a country rather than the publisher's city, and no
% series volume number is recorded -- confirm both against the publisher's record.
@inproceedings{e5716ece5c8a4a68b44c10e2ae07b074,
  author    = {Lan, Jiaying and Cheng, Lianglun and Huang, Guoheng and Pun, Chi Man and Yuan, Xiaochen and Lai, Shangyu and Liu, Hong Rui and Ling, Wing Kuen},
  title     = {Single Cross-domain Semantic Guidance Network for Multimodal Unsupervised Image Translation},
  editor    = {Dang-Nguyen, Duc-Tien and Gurrin, Cathal and Smeaton, Alan F. and Larson, Martha and Rudinac, Stevan and Dao, Minh-Son and Trattner, Christoph and Chen, Phoebe},
  booktitle = {{MultiMedia} Modeling -- 29th International Conference, {MMM} 2023, Proceedings},
  series    = {Lecture Notes in Computer Science},
  pages     = {165--177},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  year      = {2023},
  doi       = {10.1007/978-3-031-27077-2_13},
  isbn      = {9783031270765},
  language  = {English},
  keywords  = {Multimodal image translation, Semantic guidance, Unsupervised learning},
  abstract  = {Multimodal image-to-image translation has received great attention due to its flexibility and practicality. The existing methods lack the generality of effective style representation, and cannot capture different levels of stylistic semantic information from cross-domain images. Besides, they ignore the parallelism for cross-domain image generation, and their generator can only be responsible for specific domains. To address these issues, we propose a novel Single Cross-domain Semantic Guidance Network (SCSG-Net) for coarse-to-fine semantically controllable multimodal image translation. Images from different domains are mapped to a unified visual semantic latent space by a dual sparse feature pyramid encoder, and then the generative module generates the result images by extracting semantic style representation from the input images in a self-supervised manner guided by adaptive discrimination. Especially, our SCSG-Net meets the needs of users in different styles as well as diverse scenarios. Extensive experiments on different benchmark datasets show that our method can outperform other state-of-the-art methods both quantitatively and qualitatively.},
  note      = {Publisher Copyright: {\textcopyright} 2023, The Author(s), under exclusive license to Springer Nature Switzerland AG.; 29th International Conference on MultiMedia Modeling, MMM 2023 ; Conference date: 09-01-2023 Through 12-01-2023},
}