% Conference paper from the MMAsia 2025 proceedings (TSPMG framework for
% multimodal sentiment analysis). The citation key looks like an
% auto-generated export identifier; it is kept unchanged so that existing
% citations of this entry keep resolving.
@inproceedings{bf9821bdce4a4211a01f2d1eaf9710e0,
  author    = {Ma, Guoyu and Ren, Xiaoqiang and Jiang, Yan and Guan, Hongjiao and Xu, Bing},
  title     = {From Feature Alignment to Multimodal Fusion: A Two-Stage Primary Modality-Guided Approach for {MSA}},
  booktitle = {Proceedings of the 7th {ACM} International Conference on Multimedia in Asia, {MMAsia} 2025},
  editor    = {Chua, Tat-Seng and Wong, Lai-Kuan and Chan, Chee Seng and Tang, Jinhui and Ngo, Chong-Wah and Schoeffmann, Klaus and Liu, Jiaying and Ho, Yo-Sung},
  publisher = {Association for Computing Machinery, Inc},
  year      = {2025},
  month     = dec,
  day       = {6},
  doi       = {10.1145/3743093.3771041},
  language  = {english},
  keywords  = {Feature Alignment, Multimodal Fusion, Representation Learning, Sentiment Analysis},
  abstract  = {Multimodal Sentiment Analysis (MSA) aims to leverage heterogeneous data---typically language, vision, and acoustic modalities---to accurately interpret human emotional states. Despite recent advances, challenges persist due to the feature distribution difference caused by intrinsic modality heterogeneity. Prior works either neglect the contribution disparity among modalities, especially the dominant role of language in sentiment reasoning, or emphasize language dominance in fusion-space alignment, ignoring coordination in the early feature space. To address these limitations, we propose a novel Two-Stage Primary Modality-Guided (TSPMG) framework, which introduces primary-modality supervision into both feature-space distribution alignment and fusion-space attention modulation. This dual-level cooperative mechanism progressively amplifies the dominant modality's influence throughout the entire representation learning pipeline. Extensive experiments on two benchmark datasets demonstrate that TSPMG achieves superior or comparable results to state-of-the-art baselines, with ablation studies further validating the effectiveness of primary-modality-guided strategies for robust and interpretable multimodal sentiment analysis. The code is available at https://github.com/Kaisa777/TSPMG.},
  note      = {Publisher Copyright: {\textcopyright} 2025 Copyright held by the owner/author(s).; 7th ACM International Conference on Multimedia in Asia, MMAsia 2025 ; Conference date: 09-12-2025 Through 12-12-2025},
}