% Qian et al. (2018), conference paper in the PCM 2018 proceedings (Springer LNCS).
@inproceedings{019d804986424e019f1052bf1fb82251,
  author    = {Qian, Sheng and Cao, Wen-ming and Li, Rui and Wu, Si and Wong, Hau-san},
  title     = {Coupled Learning for Image Generation and Latent Representation Inference Using {MMD}},
  booktitle = {Advances in Multimedia Information Processing -- {PCM} 2018},
  editor    = {Hong, Richang and Cheng, Wen-Huang and Yamasaki, Toshihiko and Wang, Meng and Ngo, Chong-Wah},
  series    = {Lecture Notes in Computer Science},
  pages     = {430--440},
  publisher = {Springer},
  address   = {Cham},
  year      = {2018},
  month     = sep,
  doi       = {10.1007/978-3-030-00767-6_40},
  isbn      = {978-3-030-00766-9},
  language  = {English},
  keywords  = {Coupled learning, Image generation, Latent representation inference, Maximum mean discrepancy},
  abstract  = {For modeling the data distribution or the latent representation distribution in the image domain, deep learning methods such as the variational autoencoder (VAE) and the generative adversarial network (GAN) have been proposed. However, despite its capability of modeling these two distributions, VAE tends to learn less meaningful latent representations; GAN can only model the data distribution using the challenging and unstable adversarial training. To address these issues, we propose an unsupervised learning framework to perform coupled learning of these two distributions based on kernel maximum mean discrepancy (MMD). Specifically, the proposed framework consists of (1) an inference network and a generation network for mapping between the data space and the latent space, and (2) a latent tester and a data tester for performing two-sample tests in these two spaces, respectively. On one hand, we perform a two-sample test between stochastic representations from the prior distribution and inferred representations from the inference network. On the other hand, we perform a two-sample test between the real data and generated data. In addition, we impose structural regularization that the two networks are inverses of each other, so that the learning of these two distributions can be coupled. Experimental results on benchmark image datasets demonstrate that the proposed framework is competitive on image generation and latent representation inference of images compared with representative approaches.},
  note      = {19th Pacific-Rim Conference on Multimedia ({PCM} 2018); conference date: 21--22 September 2018},
}