% Conference paper, ICMLA 2021 (auto-exported record, cleaned up).
% - First author stored as "Da Silva-Filarder, Matthieu" so that "Da" is part
%   of the surname rather than a second given name.
% - The former "series" field was dropped: it repeated "booktitle" verbatim.
% - Editors use the unambiguous "Last, First" form throughout.
% NOTE(review): "address" holds a country rather than a publisher city, and
%   "note" still carries export boilerplate (copyright line, conference
%   dates); both are kept as exported -- confirm against the publisher record.
@inproceedings{4cfc48d4442741998a422f034adc9809,
  author    = {Da Silva-Filarder, Matthieu and Ancora, Andrea and Filippone, Maurizio and Michiardi, Pietro},
  title     = {Multimodal Variational Autoencoders for Sensor Fusion and Cross Generation},
  editor    = {Wani, M. Arif and Sethi, Ishwar K. and Shi, Weisong and Qu, Guangzhi and Raicu, Daniela Stan and Jin, Ruoming},
  booktitle = {Proceedings - 20th IEEE International Conference on Machine Learning and Applications, ICMLA 2021},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  pages     = {1069--1076},
  year      = {2021},
  doi       = {10.1109/ICMLA52953.2021.00175},
  note      = {Publisher Copyright: {\textcopyright} 2021 IEEE.; 20th IEEE International Conference on Machine Learning and Applications, ICMLA 2021 ; Conference date: 13-12-2021 Through 16-12-2021},
  language  = {English (US)},
  keywords  = {Autoencoder, Multimodal, Variational},
  abstract  = {The cognitive system of humans, which allows them to create representations of their surroundings exploiting multiple senses, has inspired several applications to mimic this remarkable property. The key for learning rich representations of data collected by multiple, diverse sensors, is to design generative models that can ingest multimodal inputs, and merge them in a common space. This enables to: i) obtain a coherent generation of samples for all modalities, ii) enable cross-sensor generation, by using available modalities to generate missing ones and iii) exploit synergy across modalities, to increase reconstruction quality. In this work, we study multimodal variational autoencoders, and propose new methods for learning a joint representation that can both improve synergy and enable cross generation of missing sensor data. We evaluate these approaches on well-established datasets as well as on a new dataset that involves multimodal object detection with three modalities. Our results shed light on the role of joint posterior modeling and training objectives, indicating that even simple and efficient heuristics enable both synergy and cross generation properties to coexist.},
}