@inproceedings{ff3b01f3fc18403ebf3451f9cea1525a,
title = "A Compact and Semantic Latent Space for Disentangled and Controllable Image Editing",
abstract = "Recent advances in the field of generative models and in particular generative adversarial networks (GANs) have lead to substantial progress for controlled image editing. Despite their powerful ability to apply realistic modifications to an image, these methods often lack properties such as disentanglement (the capacity to edit attributes independently). In this paper, we propose an auto-encoder which re-organizes the latent space of StyleGAN, so that each attribute which we wish to edit corresponds to an axis of the new latent space, and furthermore that the latent axes are decorrelated, encouraging disentanglement. We work in a compressed version of the latent space, using Principal Component Analysis, meaning that the parameter complexity of our autoencoder is reduced, leading to short training times (∼45 mins). Qualitative and quantitative results demonstrate the editing capabilities of our approach, with greater disentanglement than competing methods, while maintaining fidelity to the original image with respect to identity. Our autoencoder architecture is simple and straightforward, facilitating implementation.",
keywords = "Disentanglement, GANs, Generative Models, Image Editing, Latent navigation, Neural Networks",
author = "Gwilherm Lesn{\'e} and Yann Gousseau and Sa{\"i}d Ladjal and Alasdair Newson",
note = "Publisher Copyright: {\textcopyright} 2023 ACM.; 20th ACM SIGGRAPH European Conference on Visual Media Production, CVMP 2023 ; Conference date: 30-11-2023 Through 01-12-2023",
year = "2023",
month = nov,
day = "30",
doi = "10.1145/3626495.3626508",
language = "English",
series = "Proceedings - CVMP 2023: 20th ACM SIGGRAPH European Conference on Visual Media Production",
publisher = "Association for Computing Machinery, Inc",
editor = "Spencer, \{Stephen N.\}",
booktitle = "Proceedings - CVMP 2023",
}