% Conference paper: KSS-MoE (AAAI 2026 proceedings, issue 30, pages 25536--25544).
% The citation key is kept exactly as exported so existing citations keep resolving.
% Author and editor names use the unambiguous "Last, First" form.
% Only the acronym in the title is brace-protected; the style decides the remaining casing.
% The former edition field was dropped: it only repeated the issue number stored in number.
@inproceedings{168fc13151b340a08ee29b0476b13195,
  author    = {Song, Lingyun and Chen, Ziyao and Pan, Kang and Han, Xiaolin and Gan, Xinbiao and Pan, Yudai and Sun, Xiaofan and Wang, Xiaoqi and Shang, Xuequn},
  title     = {{KSS-MoE}: Knowledge Space Synergy Framework in Mixture of Experts for Continual Visual Instruction Tuning},
  booktitle = {Proceedings of the AAAI Conference on Artificial Intelligence},
  editor    = {Koenig, Sven and Jenkins, Chad and Taylor, Matthew E.},
  series    = {Proceedings of the AAAI Conference on Artificial Intelligence},
  number    = {30},
  pages     = {25536--25544},
  publisher = {Association for the Advancement of Artificial Intelligence},
  year      = {2026},
  doi       = {10.1609/aaai.v40i30.39749},
  isbn      = {9781577359067},
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} 2026, Association for the Advancement of Artificial Intelligence. All rights reserved.; 40th AAAI Conference on Artificial Intelligence, AAAI 2026 ; Conference date: 20-01-2026 Through 27-01-2026},
  abstract  = {Multimodal Large Language Models (MLLMs) employing the Mixture-of-Experts (MoE) structure exhibit encouraging results in visual language tasks. However, they struggle with catastrophic forgetting due to a lack of effective collaboration among experts and negative transfer across tasks. This happens because the router typically employed in MoE for managing expert assignments is inadequate when there are significant shifts in data distribution across various tasks. A drop in the effectiveness of earlier tasks is caused by negative transfer, which occurs due to conflicts in shared knowledge between tasks, disturbing the knowledge already acquired. To address these issues, we propose the Knowledge Space Synergy Framework in Mixture of Experts (KSS-MoE) for Continual Visual Instruction Tuning (CVIT). It dynamically combines the knowledge subspaces of experts to improve the integration of fine-grained complementary knowledge and collaborative abilities of experts, thus addressing the limitations of the basic router. Furthermore, we introduce a general expert that maintains orthogonal subspaces for shared knowledge, enabling effective cross-task knowledge utilization while reducing negative transfer. Extensive experiments conducted on eight CVIT tasks confirm the excellence of KSS-MoE, showcasing its top-tier performance.},
}