@inproceedings{wang2025findrec, author = {Wang, Maolin and Xiao, Yutian and Wang, Binhao and Zhang, Sheng and Ye, Shanshan and Wang, Wanyu and Yin, Hongzhi and Guo, Ruocheng and Xu, Zenglin}, title = {FindRec: Stein-Guided Entropic Flow for Multi-Modal Sequential Recommendation}, year = {2025}, isbn = {9798400714542}, publisher = {Association for Computing Machinery}, address = {New York, NY, USA}, url = {https://doi.org/10.1145/3711896.3736968}, doi = {10.1145/3711896.3736968}, abstract = {Modern recommendation systems face significant challenges in processing multimodal sequential data, particularly in temporal dynamics modeling and information flow coordination. Traditional approaches struggle with distribution discrepancies between heterogeneous features and noise interference in multimodal signals. We propose FindRec (Flexible unified information disentanglement for multi-modal sequential Rec ommendation), introducing a novel ''information flow-control-output'' paradigm. The framework features two key innovations: (1) A Stein kernel-based Integrated Information Coordination Module (IICM) that theoretically guarantees distribution consistency between multimodal features and ID streams, and (2) A cross-modal expert routing mechanism that adaptively filters and combines multimodal features based on their contextual relevance. Our approach leverages multi-head subspace decomposition for routing stability and RBF-Stein gradient for unbiased distribution alignment, enhanced by linear-complexity Mamba layers for efficient temporal modeling. Extensive experiments on three real-world datasets demonstrate FindRec's superior performance over state-of-the-art baselines, particularly in handling long sequences and noisy multimodal inputs. Our framework achieves both improved recommendation accuracy and enhanced model interpretability through its modular design. The implementation code is available anonymously online for easy reproducibility https://github.com/Applied-Machine-Learning-Lab/FindRec.}, booktitle = {Proceedings of the 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining V.2}, pages = {3008–3018}, numpages = {11}, keywords = {cross-modal alignment, entropy-aware fusion, information flow control, multimodal sequential recommendation}, location = {Toronto ON, Canada}, series = {KDD '25} }