@inproceedings{940fed6a0ac94babb73d26f11d8c055e,
title = "Learning in Order! A Sequential Strategy to Learn Invariant Features for Multimodal Sentiment Analysis",
abstract = "This work proposes a novel and simple sequential learning strategy to train models on videos and texts for multimodal sentiment analysis. To estimate sentiment polarities on unseen out-of-distribution data, we introduce a multimodal model that is trained either in a single source domain or multiple source domains using our learning strategy. This strategy starts with learning domain invariant features from the text, followed by learning sparse domain-agnostic features from videos, assisted by the selected features learned in text. Our experimental results demonstrate that our model achieves significantly better performance than the state-of-the-art approaches on average in both single-source and multi-source settings. Our feature selection procedure favors the features that are independent to each other and are strongly correlated with their polarity labels. To facilitate research on this topic, the source code of this work will be publicly available upon acceptance.",
keywords = "causal inference, feature selection, msa, ood",
author = "Xianbing Zhao and Lizhen Qu and Tao Feng and Jianfei Cai and Buzhou Tang",
note = "Publisher Copyright: {\textcopyright} 2024 ACM.; 32nd ACM International Conference on Multimedia, MM 2024 ; Conference date: 28-10-2024 Through 01-11-2024",
year = "2024",
month = oct,
day = "28",
doi = "10.1145/3664647.3681056",
language = "英语",
series = "MM 2024 - Proceedings of the 32nd ACM International Conference on Multimedia",
publisher = "Association for Computing Machinery, Inc",
pages = "9729--9738",
booktitle = "MM 2024 - Proceedings of the 32nd ACM International Conference on Multimedia",
}