@inproceedings{530c8432b9184d25bdfa4e90af747706,
title = "Extending long short-term memory for multi-view structured learning",
abstract = "Long Short-Term Memory (LSTM) networks have been successfully applied to a number of sequence learning problems but they lack the design flexibility to model multiple view interactions, limiting their ability to exploit multi-view relationships. In this paper, we propose a Multi-View LSTM (MV-LSTM), which explicitly models the view-specific and cross-view interactions over time or structured outputs. We evaluate the MV-LSTM model on four publicly available datasets spanning two very different structured learning problems: multimodal behaviour recognition and image captioning. The experimental results show competitive performance on all four datasets when compared with state-of-the-art models.",
keywords = "Long Short-Term Memory, Multi-View Learning, Behaviour recognition, Image Caption, Image caption, Long short-term memory, Multi-view learning",
author = "Shyam Rajagopalan and Louis-Philippe Morency and Tadas Baltrusaitis and Roland GOECKE",
year = "2016",
doi = "10.1007/978-3-319-46478-7_21",
language = "English",
isbn = "9783319464770",
volume = "9911",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer",
pages = "338--353",
editor = "Bastian Leibe and Jiri Matas and Nicu Sebe and Max Welling",
booktitle = "Proceedings of the European Conference on Computer Vision (ECCV 2016)",
address = "Netherlands",
note = "The European Conference on Computer Vision, ECCV 2016 ; Conference date: 08-10-2016 Through 16-10-2016",
}