@inproceedings{d82802b08bd0419b81da6c36544d5076,
title = "SaliencyBERT: Recurrent Attention Network for Target-Oriented Multimodal Sentiment Classification",
abstract = "As multimodal data become increasingly popular on social media platforms, it is desirable to enhance text-based approaches with other important data sources (e.g. images) for the Sentiment Classification of social media posts. However, existing approaches primarily rely on the textual content or are designed for the coarse-grained Multimodal Sentiment Classification. In this paper, we propose a recurrent attention network (called SaliencyBERT) over the BERT architecture for Target-oriented Multimodal Sentiment Classification (TMSC). Specifically, we first adopt BERT and ResNet to capture the intra-modality dynamics with the textual content and the visual information respectively. Then, we design a recurrent attention mechanism, which can derive target-sensitive visual representations, to capture the inter-modality dynamics. With recurrent attention, our model can progressively optimize the alignment of target-sensitive textual features and visual features and produce an output after a fixed number of time steps. Finally, we combine the loss of all-time steps for deep supervision to prevent converging slower and overfitting. Our empirical results show that the proposed model consistently outperforms single modal methods and achieves an indistinguishable or even better performance on several highly competitive methods on two multimodal datasets from Twitter.",
keywords = "BERT architecture, Recurrent attention, Target-oriented multimodal sentiment classification",
author = "Jiawei Wang and Zhe Liu and Victor Sheng and Yuqing Song and Chenjian Qiu",
note = "Publisher Copyright: {\textcopyright} 2021, Springer Nature Switzerland AG.; null ; Conference date: 29-10-2021 Through 01-11-2021",
year = "2021",
doi = "10.1007/978-3-030-88010-1_1",
language = "English",
isbn = "9783030880095",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "3--15",
editor = "Huimin Ma and Liang Wang and Changshui Zhang and Fei Wu and Tieniu Tan and Yaonan Wang and Jianhuang Lai and Yao Zhao",
booktitle = "Pattern Recognition and Computer Vision - 4th Chinese Conference, PRCV 2021, Proceedings",
}