% Conference paper on KcGA (Knowledge-constrained Generative VideoQA Algorithm), AAAI 2023.
% Fields `copyright`, `eventtitle`, `eventdate`, `day`, `language` and `abstract` are
% ignored by the classic BibTeX styles; they are kept as metadata only.
@inproceedings{1d66cbddec8642c9951d4d7198baa7b7,
  author     = {Jin, Yao and Niu, Guocheng and Xiao, Xinyan and Zhang, Jian and Peng, Xi and Yu, Jun},
  title      = {Knowledge-Constrained Answer Generation for Open-Ended Video Question Answering},
  booktitle  = {Proceedings of the 37th {AAAI} Conference on Artificial Intelligence, {AAAI} 2023: {AAAI-23} Technical Tracks 7},
  editor     = {Williams, Brian and Chen, Yiling and Neville, Jennifer},
  publisher  = {{AAAI} Press},
  pages      = {8141--8149},
  year       = {2023},
  month      = jun,
  day        = {27},
  doi        = {10.1609/aaai.v37i7.25983},
  language   = {english},
  eventtitle = {37th {AAAI} Conference on Artificial Intelligence, {AAAI} 2023},
  eventdate  = {2023-02-07/2023-02-14},
  copyright  = {Copyright {\textcopyright} 2023, Association for the Advancement of Artificial Intelligence (www.aaai.org). All rights reserved.},
  abstract   = {Open-ended Video question answering (open-ended VideoQA) aims to understand video content and question semantics to generate the correct answers. Most of the best performing models define the problem as a discriminative task of multi-label classification. In real-world scenarios, however, it is difficult to define a candidate set that includes all possible answers. In this paper, we propose a Knowledge-constrained Generative VideoQA Algorithm (KcGA) with an encoder-decoder pipeline, which enables out-of-domain answer generation through an adaptive external knowledge module and a multi-stream information control mechanism. We use ClipBERT to extract the video-question features, extract framewise object-level external knowledge from a commonsense knowledge base and compute the contextual-aware episode memory units via an attention based GRU to form the external knowledge features, and exploit multi-stream information control mechanism to fuse video-question and external knowledge features such that the semantic complementation and alignment are well achieved. We evaluate our model on two open-ended benchmark datasets to demonstrate that we can effectively and robustly generate high-quality answers without restrictions of training data.},
}