% Conference paper by Gu, Lang, Yue and Huang in the ICONIP 2017 proceedings
% (Lecture Notes in Computer Science, pages 276--285).
% The citation key looks like an exporter-generated identifier; it is kept
% as-is so that existing citations of this entry continue to resolve.
% NOTE(review): "address" holds a country, not the publisher's city -- confirm
% the city against the publisher record.
% NOTE(review): no series volume number is recorded here -- add "volume" once
% it has been confirmed.
@inproceedings{527193a0e30547d0a67d6f7bcdf0a104,
  author    = {Gu, Zepeng and Lang, Bo and Yue, Tongyu and Huang, Lei},
  title     = {Learning Joint Multimodal Representation Based on Multi-fusion Deep Neural Networks},
  booktitle = {Neural Information Processing - 24th International Conference, {ICONIP} 2017, Proceedings},
  editor    = {Zhao, Dongbin and El-Alfy, El-Sayed M. and Liu, Derong and Xie, Shengli and Li, Yuanqing},
  series    = {Lecture Notes in Computer Science},
  pages     = {276--285},
  publisher = {Springer Verlag},
  address   = {Germany},
  year      = {2017},
  isbn      = {9783319700953},
  doi       = {10.1007/978-3-319-70096-0_29},
  language  = {English},
  keywords  = {Deep learning, Multi-fusion, Multimodal, Semantic integration},
  abstract  = {Recently, learning joint representation of multimodal data has received more and more attentions. Multimodal features are concept-level compositive features which are more effective than those single-modality features. Most existing methods only mine interactions between modalities on the top of their networks for one time to learn multi-modal representation. In this paper, we propose a multi-fusion deep learning framework which learns multimodal features richer in semantic. The framework sets multiple fusing points in different level of feature spaces, and then integrates and passes the fusing information step by step from the low level to higher levels. Moreover, we propose a multi-channel decoding network with alternate fine-tuning strategy to fully mine the modality-specific information and cross-modality correlations. We are also the first to introduce deep learning features into multimodal deep learning, alleviating the semantic and statistical property differences between modalities to learn better features. Extensive experiments on real-world datasets demonstrate that, our proposed method achieves superior performance compared with the state-of-the-art methods.},
  note      = {Publisher Copyright: {\textcopyright} 2017, Springer International Publishing AG.; 24th International Conference on Neural Information Processing, ICONIP 2017 ; Conference date: 14-11-2017 Through 18-11-2017},
}