{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,19]],"date-time":"2026-05-19T17:07:20Z","timestamp":1779210440536,"version":"3.51.4"},"reference-count":127,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,5,19]],"date-time":"2026-05-19T00:00:00Z","timestamp":1779148800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,5,19]],"date-time":"2026-05-19T00:00:00Z","timestamp":1779148800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Multimed Info Retr"],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1007\/s13735-026-00406-x","type":"journal-article","created":{"date-parts":[[2026,5,19]],"date-time":"2026-05-19T16:22:24Z","timestamp":1779207744000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["A survey of multimodal recommender systems: methods, challenges, and future directions"],"prefix":"10.1007","volume":"15","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-3076-4546","authenticated-orcid":false,"given":"Ziyu","family":"Li","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6785-1203","authenticated-orcid":false,"given":"Shiqing","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9215-4979","authenticated-orcid":false,"given":"Weihua","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1214-6317","authenticated-orcid":false,"given":"Quan","family":"Bai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9149-2922","authenticated-orcid":false,"given":"Jianhua","family":"Jiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,5,19]]},"reference":[{"issue":"5","key":"406_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3407190","volume":"53","author":"Y Deldjoo","year":"2020","unstructured":"Deldjoo Y, Schedl M, Cremonesi P, Pasi G (2020) Recommender systems leveraging multimedia content. ACM Computing Surveys (CSUR) 53(5):1\u201338","journal-title":"ACM Computing Surveys (CSUR)"},{"issue":"1","key":"406_CR2","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3158369","volume":"52","author":"S Zhang","year":"2019","unstructured":"Zhang S, Yao L, Sun A, Tay Y (2019) Deep learning based recommender system: A survey and new perspectives. ACM Comput Surv 52(1):1\u201338","journal-title":"ACM Comput Surv"},{"issue":"3","key":"406_CR3","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3662738","volume":"3","author":"D Malitesta","year":"2025","unstructured":"Malitesta D, Cornacchia G, Pomo C, Merra FA, Di Noia T, Di Sciascio E (2025) Formalizing multimedia recommendation through multimodal deep learning. ACM Transactions on Recommender Systems 3(3):1\u201333","journal-title":"ACM Transactions on Recommender Systems"},{"issue":"2","key":"406_CR4","doi-asserted-by":"publisher","first-page":"423","DOI":"10.1109\/TPAMI.2018.2798607","volume":"41","author":"T Baltru\u0161aitis","year":"2019","unstructured":"Baltru\u0161aitis T, Ahuja C, Morency L-P (2019) Multimodal machine learning: A survey and taxonomy. IEEE Trans Pattern Anal Mach Intell 41(2):423\u2013443","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"406_CR5","unstructured":"Zhou H, Zhou X, Zeng Z, Zhang L, Shen Z (2023) A comprehensive survey on multimodal recommender systems: Taxonomy, evaluation, and future directions. arXiv preprint arXiv:2302.04473"},{"issue":"8","key":"406_CR6","doi-asserted-by":"publisher","first-page":"3549","DOI":"10.1109\/TKDE.2020.3028705","volume":"34","author":"Q Guo","year":"2020","unstructured":"Guo Q, Zhuang F, Qin C, Zhu H, Xie X, Xiong H, He Q (2020) A survey on knowledge graph-based recommender systems. IEEE Trans Knowl Data Eng 34(8):3549\u20133568","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"406_CR7","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser \u0141, Polosukhin I (2017) Attention is all you need. Adv Neural Inf Process Syst 30"},{"key":"406_CR8","doi-asserted-by":"crossref","unstructured":"He R, McAuley J (2016) Vbpr: visual bayesian personalized ranking from implicit feedback. Proceedings of the AAAI Conference on Artificial Intelligence 30","DOI":"10.1609\/aaai.v30i1.9973"},{"key":"406_CR9","doi-asserted-by":"crossref","unstructured":"Wei Y, Wang X, Nie L, He X, Hong R, Chua T-S (2019) Mmgcn: Multi-modal graph convolution network for personalized recommendation of micro-video. Proceedings of the 27th ACM International Conference on Multimedia. pp 1437\u20131445","DOI":"10.1145\/3343031.3351034"},{"issue":"5","key":"406_CR10","doi-asserted-by":"publisher","DOI":"10.1016\/j.ipm.2020.102277","volume":"57","author":"Z Tao","year":"2020","unstructured":"Tao Z, Wei Y, Wang X, He X, Huang X, Chua T-S (2020) Mgat: Multimodal graph attention network for recommendation. Information Processing & Management 57(5):102277","journal-title":"Information Processing & Management"},{"key":"406_CR11","doi-asserted-by":"publisher","first-page":"1074","DOI":"10.1109\/TMM.2021.3138298","volume":"25","author":"Q Wang","year":"2021","unstructured":"Wang Q, Wei Y, Yin J, Wu J, Song X, Nie L (2021) Dualgnn: Dual graph neural network for multimedia recommendation. IEEE Trans Multimedia 25:1074\u20131084","journal-title":"IEEE Trans Multimedia"},{"issue":"5","key":"406_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3535101","volume":"55","author":"S Wu","year":"2022","unstructured":"Wu S, Sun F, Zhang W, Xie X, Cui B (2022) Graph neural networks in recommender systems: a survey. ACM Comput Surv 55(5):1\u201337","journal-title":"ACM Comput Surv"},{"key":"406_CR13","doi-asserted-by":"publisher","first-page":"1067","DOI":"10.1109\/TMM.2021.3111487","volume":"24","author":"J Yi","year":"2021","unstructured":"Yi J, Chen Z (2021) Multi-modal variational graph auto-encoder for recommendation systems. IEEE Trans Multimedia 24:1067\u20131079","journal-title":"IEEE Trans Multimedia"},{"key":"406_CR14","doi-asserted-by":"publisher","first-page":"7149","DOI":"10.1109\/TMM.2022.3217449","volume":"25","author":"F Liu","year":"2022","unstructured":"Liu F, Chen H, Cheng Z, Liu A, Nie L, Kankanhalli M (2022) Disentangled multimodal representation learning for recommendation. IEEE Trans Multimedia 25:7149\u20137159","journal-title":"IEEE Trans Multimedia"},{"key":"406_CR15","doi-asserted-by":"crossref","unstructured":"Zhou X, Shen Z (2023) A tale of two graphs: Freezing and denoising graph structures for multimodal recommendation. Proceedings of the 31st ACM International Conference on Multimedia. pp 935\u2013943","DOI":"10.1145\/3581783.3611943"},{"key":"406_CR16","doi-asserted-by":"crossref","unstructured":"Zhou H, Zhou X, Zhang L, Shen Z (2023) Enhancing dyadic relations with homogeneous graphs for multimodal recommendation. In: Proceedings of the 26th European Conference on Artificial Intelligence (ECAI), pp. 3123\u20133130","DOI":"10.3233\/FAIA230631"},{"key":"406_CR17","doi-asserted-by":"crossref","unstructured":"Ma S, Zeng Y, Wu S, Xu G (2025) Refining contrastive learning and homography relations for multi-modal recommendation. Proceedings of the 33rd ACM International Conference on Multimedia. pp 6316\u20136324","DOI":"10.1145\/3746027.3755779"},{"key":"406_CR18","doi-asserted-by":"crossref","unstructured":"Jiang Y, Xia L, Wei W, Luo D, Lin K, Huang C (2024) Diffmm: Multi-modal diffusion model for recommendation. Proceedings of the 32nd ACM International Conference on Multimedia. pp 7591\u20137599","DOI":"10.1145\/3664647.3681498"},{"key":"406_CR19","doi-asserted-by":"crossref","unstructured":"Wei W, Tang J, Jiang Y, Xia L, Huang C (2024) Promptmm: Multi-modal knowledge distillation for recommendation with prompt-tuning. Proceedings of the ACM Web Conference 2024. pp 3217\u20133228","DOI":"10.1145\/3589334.3645359"},{"key":"406_CR20","doi-asserted-by":"crossref","unstructured":"Liu Y, Zhang K, Ren X, Huang Y, Jin J, Qin Y, Su R, Xu R, Yu Y, Zhang W (2024) Alignrec: Aligning and training in multimodal recommendations. In: Proceedings of the 33rd ACM International Conference on Information and Knowledge Management, pp. 1503\u20131512","DOI":"10.1145\/3627673.3679626"},{"key":"406_CR21","doi-asserted-by":"publisher","first-page":"13069","DOI":"10.1609\/aaai.v39i12.33426","volume":"39","author":"Y Ye","year":"2025","unstructured":"Ye Y, Zheng Z, Shen Y, Wang T, Zhang H, Zhu P, Yu R, Zhang K, Xiong H (2025) Harnessing multimodal large language models for multimodal sequential recommendation. Proceedings of the AAAI Conference on Artificial Intelligence 39:13069\u201313077","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"issue":"5","key":"406_CR22","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1007\/s11280-024-01291-2","volume":"27","author":"L Wu","year":"2024","unstructured":"Wu L, Zheng Z, Qiu Z, Wang H, Gu H, Shen T, Qin C, Zhu C, Zhu H, Liu Q, Xiong H, Chen E (2024) A survey on large language models for recommendation. World Wide Web 27(5):60","journal-title":"World Wide Web"},{"issue":"2","key":"406_CR23","first-page":"1","volume":"57","author":"Q Liu","year":"2024","unstructured":"Liu Q, Hu J, Xiao Y, Zhao X, Gao J, Wang W, Li Q, Tang J (2024) Multimodal recommender systems: A survey. ACM Comput Surv 57(2):1\u201317","journal-title":"ACM Comput Surv"},{"issue":"03","key":"406_CR24","doi-asserted-by":"publisher","first-page":"411","DOI":"10.1142\/S1793351X17500039","volume":"11","author":"M Ge","year":"2017","unstructured":"Ge M, Persia F (2017) A survey of multimedia recommender systems: Challenges and opportunities. International Journal of Semantic Computing 11(03):411\u2013428","journal-title":"International Journal of Semantic Computing"},{"key":"406_CR25","doi-asserted-by":"crossref","unstructured":"Xu J, Chen Z, Yang S, Li J, Wang W, Hu X, Hoi S, Ngai E (2025) A survey on multimodal recommender systems: Recent advances and future directions.(arXiv preprint)","DOI":"10.1109\/TMM.2026.3668620"},{"key":"406_CR26","unstructured":"Ramisa A, Vidal R, Deldjoo Y, He Z, McAuley J, Korikov A, Sanner S, Sathiamoorthy M, Kasrizadeh A, Milano S, et al (2024) Multi-modal generative models in recommendation system. arXiv preprint arXiv:2409.10993"},{"key":"406_CR27","unstructured":"Wei T-R, Fang Y (2025) Diffusion models in recommendation systems: A survey.(arXiv preprint)"},{"key":"406_CR28","unstructured":"Radford A, Kim JW, Hallacy C, Ramesh A, Goh G, Agarwal S, Sastry G, Askell A, Mishkin P, Clark J (2021) Learning transferable visual models from natural language supervision. International Conference on Machine Learning. pp 8748\u20138763 (PMLR)"},{"key":"406_CR29","doi-asserted-by":"publisher","first-page":"12908","DOI":"10.1609\/aaai.v39i12.33408","volume":"39","author":"J Xu","year":"2025","unstructured":"Xu J, Chen Z, Yang S, Li J, Wang H, Ngai EC (2025) Mentor: multi-level self-supervised learning for multimodal recommendation. Proceedings of the AAAI Conference on Artificial Intelligence 39:12908\u201312917","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"issue":"1","key":"406_CR30","doi-asserted-by":"publisher","first-page":"12062","DOI":"10.1038\/s41598-025-96458-w","volume":"15","author":"X Xiao","year":"2025","unstructured":"Xiao X (2025) Mmagentrec, a personalized multi-modal recommendation agent with large language model. Sci Rep 15(1):12062","journal-title":"Sci Rep"},{"key":"406_CR31","doi-asserted-by":"crossref","unstructured":"McAuley J, Targett C, Shi Q, Van Den Hengel, A (2015) Image-based recommendations on styles and substitutes. In: Proceedings of the 38th International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 43\u201352","DOI":"10.1145\/2766462.2767755"},{"issue":"2","key":"406_CR32","doi-asserted-by":"publisher","first-page":"317","DOI":"10.1109\/TKDE.2018.2881260","volume":"32","author":"Q Cui","year":"2018","unstructured":"Cui Q, Wu S, Liu Q, Zhong W, Wang L (2018) Mv-rnn: A multi-view recurrent neural network for sequential recommendation. IEEE Trans Knowl Data Eng 32(2):317\u2013331","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"406_CR33","unstructured":"Li J, Li D, Xiong C, Hoi S.C.H (2022) Blip: Bootstrapping language-image pre-training for unified vision-language understanding and generation. In: Proceedings of the 39th International Conference on Machine Learning (ICML). PMLR, 162:12888\u201312900"},{"key":"406_CR34","unstructured":"Bao H, Wang W, Dong L, Liu Q, Mohammed OK, Aggarwal K, Som S, Piao S, Wei F (2022) Vlmo: Unified vision-language pre-training with mixture-of-modality-experts. Advances in Neural Information Processing Systems (NeurIPS)"},{"key":"406_CR35","unstructured":"Yi Z, Long Z, Ounis I, Macdonald C, Mccreadie R (2023) Large multi-modal encoders for recommendation.(arXiv preprint)"},{"key":"406_CR36","doi-asserted-by":"crossref","unstructured":"Yi Z, Long Z, Ounis I, Macdonald C, McCreadie R (2025) Enhancing recommender systems: Deep modality alignment with large multi-modal encoders. ACM Transactions on Recommender Systems","DOI":"10.1145\/3718099"},{"key":"406_CR37","doi-asserted-by":"crossref","unstructured":"Yu P, Tan Z, Lu G, Bao B-K (2023) Multi-view graph convolutional network for multimedia recommendation. Proceedings of the 31st ACM International Conference on Multimedia. pp 6576\u20136585","DOI":"10.1145\/3581783.3613915"},{"key":"406_CR38","doi-asserted-by":"crossref","unstructured":"Liu X, Tao Z, Shao J, Yang L, Huang X (2022) Elimrec: Eliminating single-modal bias in multimedia recommendation. Proceedings of the 30th ACM International Conference on Multimedia. pp 687\u2013695","DOI":"10.1145\/3503161.3548404"},{"key":"406_CR39","doi-asserted-by":"crossref","unstructured":"Yang W, Fang Z, Zhang T, Wu S, Lu C (2023) Modal-aware bias constrained contrastive learning for multimodal recommendation. Proceedings of the 31st ACM International Conference on Multimedia. pp 6369\u20136378","DOI":"10.1145\/3581783.3612568"},{"key":"406_CR40","doi-asserted-by":"crossref","unstructured":"Lin X, Liu R, Cao Y, Zou L, Li Q, Wu Y, Liu Y, Yin D, Xu G (2025) Contrastive modality-disentangled learning for multimodal recommendation. ACM Transactions on Information Systems","DOI":"10.1145\/3715876"},{"issue":"1","key":"406_CR41","first-page":"1","volume":"37","author":"Y Tan","year":"2025","unstructured":"Tan Y, Wang M, Wang C, Zhao X (2025) Ammrm: an adaptive multi-modal recommendation model with noise filtering and modal feature enhancement. Journal of King Saud University Computer and Information Sciences 37(1):1\u201318","journal-title":"Journal of King Saud University Computer and Information Sciences"},{"key":"406_CR42","doi-asserted-by":"crossref","unstructured":"Wang C, Niepert M, Li H (2018) Lrmm: Learning to recommend with missing modalities. Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing. pp 3360\u20133370","DOI":"10.18653\/v1\/D18-1373"},{"key":"406_CR43","doi-asserted-by":"publisher","first-page":"8941","DOI":"10.1109\/TMM.2024.3384058","volume":"26","author":"J Yi","year":"2024","unstructured":"Yi J, Chen Z (2024) Variational mixture of stochastic experts auto-encoder for multi-modal recommendation. IEEE Trans Multimedia 26:8941\u20138954","journal-title":"IEEE Trans Multimedia"},{"key":"406_CR44","doi-asserted-by":"crossref","unstructured":"Hu H, Guo W, Liu Y, Kan M-Y (2023) Adaptive multi-modalities fusion in sequential recommendation systems. Proceedings of the 32nd ACM International Conference on Information and Knowledge Management. pp 843\u2013853","DOI":"10.1145\/3583780.3614775"},{"key":"406_CR45","doi-asserted-by":"crossref","unstructured":"Malitesta D, Rossi E, Pomo C, Di Noia T, Malliaros F.D (2024) Do we really need to drop items with missing modalities in multimodal recommendation? In: Proceedings of the 33rd ACM International Conference on Information and Knowledge Management, pp. 3943\u20133948","DOI":"10.1145\/3627673.3679898"},{"key":"406_CR46","doi-asserted-by":"crossref","unstructured":"Ganh\u00f6r C, Moscati M, Hausberger A, Nawaz S, Schedl M (2024) A multimodal single-branch embedding network for recommendation in cold-start and missing modality scenarios. Proceedings of the 18th ACM Conference on Recommender Systems. pp 380\u2013390","DOI":"10.1145\/3640457.3688138"},{"key":"406_CR47","doi-asserted-by":"crossref","unstructured":"He X, Deng K, Wang X, Li Y, Zhang Y, Wang M (2020) Lightgcn: Simplifying and powering graph convolution network for recommendation. In: Proceedings of the 43rd International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 639\u2013648","DOI":"10.1145\/3397271.3401063"},{"key":"406_CR48","doi-asserted-by":"crossref","unstructured":"Zhou X (2023) Mmrec: Simplifying multimodal recommendation. Proceedings of the 5th ACM International Conference on Multimedia in Asia Workshops. pp 1\u20132","DOI":"10.1145\/3611380.3628561"},{"key":"406_CR49","first-page":"14200","volume":"34","author":"A Nagrani","year":"2021","unstructured":"Nagrani A, Yang S, Arnab A, Jansen A, Schmid C, Sun C (2021) Attention bottlenecks for multimodal fusion. Adv Neural Inf Process Syst 34:14200\u201314213","journal-title":"Adv Neural Inf Process Syst"},{"key":"406_CR50","doi-asserted-by":"publisher","first-page":"8454","DOI":"10.1609\/aaai.v38i8.28688","volume":"38","author":"Z Guo","year":"2024","unstructured":"Guo Z, Li J, Li G, Wang C, Shi S, Ruan B (2024) Lgmrec: Local and global graph learning for multimodal recommendation. Proceedings of the AAAI Conference on Artificial Intelligence 38:8454\u20138462","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"key":"406_CR51","doi-asserted-by":"crossref","unstructured":"Zhang J, Zhu Y, Liu Q, Wu S, Wang S, Wang L (2021) Mining latent structures for multimedia recommendation. In: Proceedings of the 29th ACM International Conference on Multimedia, pp. 3872\u20133880","DOI":"10.1145\/3474085.3475259"},{"key":"406_CR52","doi-asserted-by":"crossref","unstructured":"Mu Z, Zhuang Y, Tan J, Xiao J, Tang S (2022) Learning hybrid behavior patterns for multimedia recommendation. In: Proceedings of the 30th ACM International Conference on Multimedia, pp. 376\u2013384","DOI":"10.1145\/3503161.3548119"},{"key":"406_CR53","doi-asserted-by":"crossref","unstructured":"Sun R, Cao X, Zhao Y, Wan J, Zhou K, Zhang F, Wang Z, Zheng,d K (2020) Multi-modal knowledge graphs for recommender systems. In: Proceedings of the 29th ACM International Conference on Information & Knowledge Management, pp. 1405\u20131414","DOI":"10.1145\/3340531.3411947"},{"key":"406_CR54","doi-asserted-by":"crossref","unstructured":"Liu Y, Yang S, Lei C, Wang G, Tang H, Zhang J, Sun A, Miao C (2021) Pre-training graph transformer with multimodal side information for recommendation. Proceedings of the 29th ACM International Conference on Multimedia. pp 2853\u20132861","DOI":"10.1145\/3474085.3475709"},{"key":"406_CR55","doi-asserted-by":"crossref","unstructured":"Xu Q, Shen F, Liu L, Shen H.T (2018) Graphcar: Content-aware multimedia recommendation with graph autoencoder. In: The 41st International ACM SIGIR Conference on Research & Development in Information Retrieval, pp. 981\u2013984","DOI":"10.1145\/3209978.3210117"},{"key":"406_CR56","doi-asserted-by":"crossref","unstructured":"Chen J, Zhang H, He X, Nie L, Liu W, Chua T-S (2017) Attentive collaborative filtering: Multimedia recommendation with item-and component-level attention. Proceedings of the 40th International ACM SIGIR Conference on Research and Development in Information Retrieval. pp 335\u2013344","DOI":"10.1145\/3077136.3080797"},{"key":"406_CR57","doi-asserted-by":"crossref","unstructured":"Zhou Y, Guo J, Sun H, Song B, Yu FR (2023) Attention-guided multi-step fusion: A hierarchical fusion network for multimodal recommendation. Proceedings of the 46th International Acm Sigir Conference on Research and Development in Information Retrieval. pp 1816\u20131820","DOI":"10.1145\/3539618.3591950"},{"issue":"2","key":"406_CR58","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3291060","volume":"37","author":"Z Cheng","year":"2019","unstructured":"Cheng Z, Chang X, Zhu L, Kanjirathinkal RC, Kankanhalli M (2019) Mmalfm: Explainable recommendation by leveraging reviews and images. ACM Transactions on Information Systems (TOIS) 37(2):1\u201328","journal-title":"ACM Transactions on Information Systems (TOIS)"},{"key":"406_CR59","doi-asserted-by":"crossref","unstructured":"Liu F, Cheng Z, Sun C, Wang Y, Nie L, Kankanhalli M (2019) User diverse preference modeling by multimodal attentive metric learning. Proceedings of the 27th ACM International Conference on Multimedia. pp 1526\u20131534","DOI":"10.1145\/3343031.3350953"},{"key":"406_CR60","doi-asserted-by":"crossref","unstructured":"Han T, Wang P, Niu S, Li C (2022) Modality matches modality: Pretraining modality-disentangled item representations for recommendation. Proceedings of the ACM Web Conference 2022. pp 2058\u20132066","DOI":"10.1145\/3485447.3512079"},{"key":"406_CR61","doi-asserted-by":"crossref","unstructured":"Wei W, Huang C, Xia L, Zhang C (2023) Multi-modal self-supervised learning for recommendation. Proceedings of the ACM Web Conference 2023. pp 790\u2013800","DOI":"10.1145\/3543507.3583206"},{"key":"406_CR62","doi-asserted-by":"crossref","unstructured":"Wang S, Wang Y (2023) 3mvgat: Multi-modal and multi-view knowledge graph attention network for recommendation algorithm. In: 2023 4th International Conference on Computers and Artificial Intelligence Technology (CAIT), pp. 26\u201333. IEEE","DOI":"10.1109\/CAIT59945.2023.10468706"},{"key":"406_CR63","unstructured":"Ma L, Li X, Fan Z, Zhao K, Xu J, Cho J, Kanumala P, Nag K, Kumar S, Achan K (2024) Triple modality fusion: Aligning visual, textual, and graph data with large language models for multi-behavior recommendations.(arXiv preprint)"},{"issue":"10","key":"406_CR64","doi-asserted-by":"publisher","first-page":"18587","DOI":"10.1109\/TNNLS.2025.3583509","volume":"36","author":"Q Song","year":"2025","unstructured":"Song Q, Hu J, Xiao L, Sun B, Gao X, Li S (2025) Diffcl: A diffusion-based contrastive learning framework with semantic alignment for multimodal recommendations. IEEE Transactions on Neural Networks and Learning Systems 36(10):18587\u201318597","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"406_CR65","doi-asserted-by":"crossref","unstructured":"Liu Q, Wu S, Wang L (2017) Deepstyle: Learning user preferences for visual recommendation. Proceedings of the 40th International Acm Sigir Conference on Research and Development in Information Retrieval. pp 841\u2013844","DOI":"10.1145\/3077136.3080658"},{"key":"406_CR66","doi-asserted-by":"crossref","unstructured":"He R, Fang C, Wang Z, McAuley J (2016) Vista: A visually, socially, and temporally-aware model for artistic recommendation. In: Proceedings of the 10th ACM Conference on Recommender Systems, pp. 309\u2013316","DOI":"10.1145\/2959100.2959152"},{"key":"406_CR67","doi-asserted-by":"crossref","unstructured":"Xun J, Zhang S, Zhao Z, Zhu J, Zhang Q, Li J, He X, He X, Chua T.-S, Wu F (2021) Why do we click: visual impression-aware news recommendation. In: Proceedings of the 29th ACM International Conference on Multimedia, pp. 3881\u20133890","DOI":"10.1145\/3474085.3475514"},{"key":"406_CR68","doi-asserted-by":"crossref","unstructured":"Tian J, Wang Z, Zhao J, Ding Z (2024) Mmrec: Llm based multi-modal recommender system. In: 2024 19th International Workshop on Semantic and Social Media Adaptation & Personalization (SMAP), pp. 105\u2013110. IEEE","DOI":"10.1109\/SMAP63474.2024.00028"},{"key":"406_CR69","doi-asserted-by":"crossref","unstructured":"Kim Y, Kim T, Shin W.-Y, Kim S.-W (2024) Monet: Modality-embracing graph convolutional network and target-aware attention for multimedia recommendation. In: Proceedings of the 17th ACM International Conference on Web Search and Data Mining, pp. 332\u2013340","DOI":"10.1145\/3616855.3635817"},{"key":"406_CR70","doi-asserted-by":"crossref","unstructured":"Ong RK, Khong AW (2025) Spectrum-based modality representation fusion graph convolutional network for multimodal recommendation. Proceedings of the Eighteenth ACM International Conference on Web Search and Data Mining. pp 773\u2013781","DOI":"10.1145\/3701551.3703561"},{"key":"406_CR71","unstructured":"Dong X, Song X, Zheng N, Zhao S, Ding G (2025) Modality reliability guided multimodal recommendation.(arXiv preprint)"},{"key":"406_CR72","doi-asserted-by":"crossref","unstructured":"Yi Z, Wang X, Ounis I, Macdonald C (2022) Multi-modal graph contrastive learning for micro-video recommendation. Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval. pp 1807\u20131811","DOI":"10.1145\/3477495.3532027"},{"key":"406_CR73","doi-asserted-by":"crossref","unstructured":"Lin Z, Tan Y, Zhan Y, Liu W, Wang F, Chen C, Wang S, Yang C (2023) Contrastive intra-and inter-modality generation for enhancing incomplete multimedia recommendation. In: Proceedings of the 31st ACM International Conference on Multimedia, pp. 6234\u20136242","DOI":"10.1145\/3581783.3612362"},{"key":"406_CR74","doi-asserted-by":"publisher","first-page":"5107","DOI":"10.1109\/TMM.2022.3187556","volume":"25","author":"Z Tao","year":"2022","unstructured":"Tao Z, Liu X, Xia Y, Wang X, Yang L, Huang X, Chua T-S (2022) Self-supervised learning for multimedia recommendation. IEEE Trans Multimedia 25:5107\u20135116","journal-title":"IEEE Trans Multimedia"},{"key":"406_CR75","doi-asserted-by":"crossref","unstructured":"Kang W.-C, Fang C, Wang Z, McAuley J (2017) Visually-aware fashion recommendation and design with generative image models. In: 2017 IEEE International Conference on Data Mining (ICDM), pp. 207\u2013216 . IEEE","DOI":"10.1109\/ICDM.2017.30"},{"key":"406_CR76","doi-asserted-by":"crossref","unstructured":"Li J, Wang S, Zhang Q, Yu S, Chen F (2025) Generating with fairness: A modality-diffused counterfactual framework for incomplete multimodal recommendations. Proceedings of the ACM on Web Conference 2025. pp 2787\u20132798","DOI":"10.1145\/3696410.3714606"},{"key":"406_CR77","doi-asserted-by":"publisher","first-page":"9343","DOI":"10.1109\/TMM.2023.3251108","volume":"25","author":"K Liu","year":"2023","unstructured":"Liu K, Xue F, Guo D, Sun P, Qian S, Hong R (2023) Multimodal graph contrastive learning for multimedia-based recommendation. IEEE Trans Multimedia 25:9343\u20139355","journal-title":"IEEE Trans Multimedia"},{"key":"406_CR78","doi-asserted-by":"crossref","unstructured":"Zhou X, Zhou H, Liu Y, Zeng Z, Miao C, Wang P, You Y, Jiang F (2023) Bootstrap latent representations for multi-modal recommendation. In: Proceedings of the ACM Web Conference 2023, pp. 845\u2013854","DOI":"10.1145\/3543507.3583251"},{"key":"406_CR79","unstructured":"Wu X, Huang A, Yang H, He H, Tai Y, Zhang W (2024) Towards bridging the cross-modal semantic gap for multi-modal recommendation.(arXiv preprint)"},{"key":"406_CR80","doi-asserted-by":"crossref","unstructured":"Girdhar R, El-Nouby A, Liu Z, Singh M, Alwala KV, Joulin A, Misra I (2023) Imagebind: One embedding space to bind them all. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. pp 15180\u201315190","DOI":"10.1109\/CVPR52729.2023.01457"},{"key":"406_CR81","unstructured":"Daunhawer I, Bizeul A, Palumbo E, Marx A, Vogt JE (2023) Identifiability results for multimodal contrastive learning. International Conference on Learning Representations (ICLR"},{"issue":"6","key":"406_CR82","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1007\/s00138-021-01249-8","volume":"32","author":"SY Boulahia","year":"2021","unstructured":"Boulahia SY, Amamra A, Madi MR, Daikh S (2021) Early, intermediate and late fusion strategies for robust deep learning-based multimodal action recognition. Mach Vis Appl 32(6):121","journal-title":"Mach Vis Appl"},{"issue":"8","key":"406_CR83","doi-asserted-by":"publisher","first-page":"30","DOI":"10.1109\/MC.2009.263","volume":"42","author":"Y Koren","year":"2009","unstructured":"Koren Y, Bell R, Volinsky C (2009) Matrix factorization techniques for recommender systems. Computer 42(8):30\u201337","journal-title":"Computer"},{"key":"406_CR84","doi-asserted-by":"crossref","unstructured":"Agarwal D, Chen B-C (2009) Regression-based latent factor models. Proceedings of the 15th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining. pp 19\u201328","DOI":"10.1145\/1557019.1557029"},{"key":"406_CR85","doi-asserted-by":"crossref","unstructured":"Rendle S (2010) Factorization machines. 2010 IEEE International Conference on Data Mining. IEEE, pp 995\u20131000","DOI":"10.1109\/ICDM.2010.127"},{"key":"406_CR86","doi-asserted-by":"crossref","unstructured":"Wang C, Blei DM (2011) Collaborative topic modeling for recommending scientific articles. Proceedings of the 17th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining. pp 448\u2013456","DOI":"10.1145\/2020408.2020480"},{"key":"406_CR87","doi-asserted-by":"crossref","unstructured":"McAuley J, Leskovec J (2013) Hidden factors and hidden topics: understanding rating dimensions with review text. In: Proceedings of the 7th ACM Conference on Recommender Systems, pp. 165\u2013172","DOI":"10.1145\/2507157.2507163"},{"key":"406_CR88","doi-asserted-by":"crossref","unstructured":"Sedhain S, Sanner S, Braziunas D, Xie L, Christensen J (2014) Social collaborative filtering for cold-start recommendations. Proceedings of the 8th ACM Conference on Recommender Systems. pp 345\u2013348","DOI":"10.1145\/2645710.2645772"},{"key":"406_CR89","doi-asserted-by":"crossref","unstructured":"Wang H, Wang N, Yeung D.-Y (2015) Collaborative deep learning for recommender systems. In: Proceedings of the 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 1235\u20131244","DOI":"10.1145\/2783258.2783273"},{"key":"406_CR90","doi-asserted-by":"crossref","unstructured":"Liang J, Zhao X, Li M, Zhang Z, Wang W, Liu H, Liu Z (2023) Mmmlp: Multi-modal multilayer perceptron for sequential recommendations. In: Proceedings of the ACM Web Conference 2023, pp. 1109\u20131117","DOI":"10.1145\/3543507.3583378"},{"issue":"2","key":"406_CR91","first-page":"1","volume":"42","author":"H Liu","year":"2023","unstructured":"Liu H, Wei Y, Liu F, Wang W, Nie L, Chua T-S (2023) Dynamic multimodal fusion via meta-learning towards micro-video recommendation. ACM Transactions on Information Systems 42(2):1\u201326","journal-title":"ACM Transactions on Information Systems"},{"key":"406_CR92","doi-asserted-by":"crossref","unstructured":"Huang J, Qin J, Yu Y, Zhang W (2025) Beyond graph convolution: Multimodal recommendation with topology-aware mlps. Proceedings of the AAAI Conference on Artificial Intelligence, vol 39. pp 11808\u201311816","DOI":"10.1609\/aaai.v39i11.33285"},{"issue":"5","key":"406_CR93","doi-asserted-by":"publisher","first-page":"2907","DOI":"10.3390\/su14052907","volume":"14","author":"X Ren","year":"2022","unstructured":"Ren X, Yang W, Jiang X, Jin G, Yu Y (2022) A deep learning framework for multimodal course recommendation based on lstm+ attention. Sustainability 14(5):2907","journal-title":"Sustainability"},{"key":"406_CR94","doi-asserted-by":"crossref","unstructured":"Chen X, Chen H, Xu H, Zhang Y, Cao Y, Qin Z, Zha H (2019) Personalized fashion recommendation with visual explanations based on multimodal attention network: Towards visually explainable recommendation. In: Proceedings of the 42nd International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 765\u2013774","DOI":"10.1145\/3331184.3331254"},{"issue":"3","key":"406_CR95","doi-asserted-by":"publisher","first-page":"768","DOI":"10.1109\/TCSS.2020.2986778","volume":"7","author":"Q Yang","year":"2020","unstructured":"Yang Q, Wu G, Li Y, Li R, Gu X, Deng H, Wu J (2020) Amnn: Attention-based multimodal neural network model for hashtag recommendation. IEEE Transactions on Computational Social Systems 7(3):768\u2013779","journal-title":"IEEE Transactions on Computational Social Systems"},{"key":"406_CR96","doi-asserted-by":"publisher","first-page":"120023","DOI":"10.1109\/ACCESS.2022.3221812","volume":"10","author":"S Kitada","year":"2022","unstructured":"Kitada S, Iwazaki Y, Togashi R, Iyatomi H (2022) Dm 2 s 2: Deep multimodal sequence sets with hierarchical modality attention. IEEE Access 10:120023\u2013120034","journal-title":"IEEE Access"},{"key":"406_CR97","unstructured":"Burabak M, Aytekin T (2024) Synergraph: An integrated graph convolution network for multimodal recommendation.(arXiv preprint)"},{"key":"406_CR98","doi-asserted-by":"crossref","unstructured":"Yi Z, Ounis I (2024) A unified graph transformer for overcoming isolations in multi-modal recommendation. Proceedings of the 18th ACM Conference on Recommender Systems. pp 518\u2013527","DOI":"10.1145\/3640457.3688096"},{"key":"406_CR99","doi-asserted-by":"crossref","unstructured":"Zhou H, Wang Y, Zhan H (2025) Mde: Modality discrimination enhancement for multi-modal recommendation.(arXiv preprint)","DOI":"10.1109\/ISCAS56072.2025.11043966"},{"key":"406_CR100","doi-asserted-by":"publisher","first-page":"7543","DOI":"10.1109\/TMM.2024.3369875","volume":"26","author":"X Zhou","year":"2024","unstructured":"Zhou X, Miao C (2024) Disentangled graph variational auto-encoder for multimodal recommendation with interpretability. IEEE Trans Multimedia 26:7543\u20137554","journal-title":"IEEE Trans Multimedia"},{"key":"406_CR101","doi-asserted-by":"crossref","unstructured":"Ma H, Yang Y, Meng L, Xie R, Meng X (2024) Multimodal conditioned diffusion model for recommendation. In: Companion Proceedings of the ACM Web Conference 2024, pp. 1733\u20131740","DOI":"10.1145\/3589335.3651956"},{"key":"406_CR102","unstructured":"Jiang J, Huang Y, Liu B, Kong X, Xu Z, Zhu H, Xu J, Zheng B (2025) Large language model as universal retriever in industrial-scale recommender system. arXiv preprint arXiv:2502.03041"},{"key":"406_CR103","unstructured":"Huang C, Wu J, Xia Y, Yu Z, Wang R, Yu T, Zhang R, Rossi R.A, Kveton B, Zhou D, et al (2025) Towards agentic recommender systems in the era of multimodal large language models. arXiv preprint arXiv:2503.16734"},{"issue":"9","key":"406_CR104","first-page":"1","volume":"21","author":"X Liu","year":"2025","unstructured":"Liu X, Song Q, Xiao L, Wang C, Gao X (2025) Lpic: Learnable prompts and id-guided contrastive learning for multimodal recommendation. ACM Trans Multimed Comput Commun Appl 21(9):1\u201316","journal-title":"ACM Trans Multimed Comput Commun Appl"},{"key":"406_CR105","doi-asserted-by":"crossref","unstructured":"Yang Y, Ma H, Meng L, Xu S, Xie R, Meng X (2025) Curriculum conditioned diffusion for multimodal recommendation. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 39, pp. 13035\u201313043","DOI":"10.1609\/aaai.v39i12.33422"},{"key":"406_CR106","doi-asserted-by":"crossref","unstructured":"Zhang F, Chen J, Li H, Wang S, Cao Y, Wei K, He J, Kou F, Wang J (2025) Leveraging multimodal data and side users for diffusion cross-domain recommendation. arXiv preprint arXiv:2507.04000","DOI":"10.1145\/3746027.3754555"},{"key":"406_CR107","doi-asserted-by":"crossref","unstructured":"Wei Y, Wang X, Nie L, He X, Chua T-S (2020) Graph-refined convolutional network for multimedia recommendation with implicit feedback. Proceedings of the 28th ACM International Conference on Multimedia. pp 3541\u20133549","DOI":"10.1145\/3394171.3413556"},{"key":"406_CR108","doi-asserted-by":"crossref","unstructured":"Yang W, Yang J, Liu Y (2023) Multimodal optimal transport knowledge distillation for cross-domain recommendation. In: Proceedings of the 32nd ACM International Conference on Information and Knowledge Management, pp. 2959\u20132968","DOI":"10.1145\/3583780.3614983"},{"key":"406_CR109","unstructured":"Zhang W, Luo J, Zhang X, Fang Y (2025) Bridging domain gaps between pretrained multimodal models and recommendations. arXiv preprint arXiv:2502.15542"},{"key":"406_CR110","doi-asserted-by":"crossref","unstructured":"Ji W, Liu X, Zhang A, Wei Y, Ni Y, Wang X (2023) Online distillation-enhanced multi-modal transformer for sequential recommendation. Proceedings of the 31st ACM International Conference on Multimedia. pp 955\u2013965","DOI":"10.1145\/3581783.3612091"},{"key":"406_CR111","unstructured":"He Z, Wang Z, Yang Y, Bai H, Wu L (2024) It is never too late to mend: Separate learning for multimedia recommendation.(arXiv preprint)"},{"key":"406_CR112","doi-asserted-by":"crossref","unstructured":"Ni Y, Cheng Y, Liu X, Fu J, Li Y, He X, Zhang Y, Yuan F (2025) A content-driven micro-video recommendation dataset at scale. Proceedings of the 34th ACM International Conference on Information and Knowledge Management","DOI":"10.1145\/3746252.3761655"},{"key":"406_CR113","doi-asserted-by":"crossref","unstructured":"Shang Y, Gao C, Li N, Li Y (2025) A large-scale dataset with behavior, attributes, and content of mobile short-video platform. In: Companion Proceedings of the ACM Web Conference 2025, pp. 793\u2013796","DOI":"10.1145\/3701716.3715296"},{"key":"406_CR114","doi-asserted-by":"publisher","first-page":"1246","DOI":"10.7717\/peerj-cs.1246","volume":"9","author":"W Zhang","year":"2023","unstructured":"Zhang W (2023) Design of news recommendation model based on sub-attention news encoder. PeerJ Computer Science 9:1246","journal-title":"PeerJ Computer Science"},{"key":"406_CR115","doi-asserted-by":"crossref","unstructured":"Borg Bruun S, Balog K, Maistro M (2024) Dataset and models for item recommendation using multi-modal user interactions. Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval. pp 709\u2013718","DOI":"10.1145\/3626772.3657881"},{"key":"406_CR116","doi-asserted-by":"crossref","unstructured":"Attimonelli M, Danese D, Di Fazio A, Malitesta D, Pomo C, Di Noia T (2024) Ducho meets elliot: Large-scale benchmarks for multimodal recommendation.(arXiv preprint)","DOI":"10.2139\/ssrn.5349267"},{"issue":"1","key":"406_CR117","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1145\/963770.963772","volume":"22","author":"JL Herlocker","year":"2004","unstructured":"Herlocker JL, Konstan JA, Terveen LG, Riedl JT (2004) Evaluating collaborative filtering recommender systems. ACM Transactions on Information Systems (TOIS) 22(1):5\u201353","journal-title":"ACM Transactions on Information Systems (TOIS)"},{"issue":"4","key":"406_CR118","doi-asserted-by":"publisher","first-page":"422","DOI":"10.1145\/582415.582418","volume":"20","author":"K J\u00e4rvelin","year":"2002","unstructured":"J\u00e4rvelin K, Kek\u00e4l\u00e4inen J (2002) Cumulated gain-based evaluation of ir techniques. ACM Transactions on Information Systems (TOIS) 20(4):422\u2013446","journal-title":"ACM Transactions on Information Systems (TOIS)"},{"key":"406_CR119","unstructured":"Castells P, Vargas S, Wang J (2011) Novelty and diversity metrics for recommender systems: choice, discovery and relevance. International Workshop on Diversity in Document Retrieval (DDR 2011) at the 33rd European Conference on Information Retrieval (ECIR 2011). Citeseer, pp 29\u201336"},{"key":"406_CR120","doi-asserted-by":"crossref","unstructured":"Parapar J, Radlinski F (2021) Towards unified metrics for accuracy and diversity for recommender systems. Proceedings of the 15th ACM Conference on Recommender Systems. pp 75\u201384","DOI":"10.1145\/3460231.3474234"},{"issue":"8","key":"406_CR121","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3556536","volume":"55","author":"E Zangerle","year":"2022","unstructured":"Zangerle E, Bauer C (2022) Evaluating recommender systems: survey and framework. ACM Comput Surv 55(8):1\u201338","journal-title":"ACM Comput Surv"},{"key":"406_CR122","unstructured":"Kornblith S, Norouzi M, Lee H, Hinton G (2019) Similarity of neural network representations revisited. International Conference on Machine Learning. pp 3519\u20133529 (PMLR)"},{"key":"406_CR123","doi-asserted-by":"crossref","unstructured":"Labbaki S, Minary P Orthogonal sequential fusion in multimodal learning. Proceedings of the 28th International Conference on Information Fusion (FUSION) (2025). IEEE","DOI":"10.23919\/FUSION65864.2025.11124022"},{"key":"406_CR124","unstructured":"Lundberg SM, Lee S-I (2017) A unified approach to interpreting model predictions. Advances in Neural Information Processing Systems, vol 30"},{"key":"406_CR125","unstructured":"Sundararajan M, Taly A, Yan Q (2017) Axiomatic attribution for deep networks. Proceedings of the 34th International Conference on Machine Learning. PMLR, vol 70. pp 3319\u20133328"},{"key":"406_CR126","doi-asserted-by":"crossref","unstructured":"Zhu F, Wang Y, Chen C, Zhou J, Li L, Liu G (2021) Cross-domain recommendation: challenges, progress, and prospects. In: Proceedings of the Thirtieth International Joint Conference on Artificial Intelligence (IJCAI-21), pp. 4721\u20134728","DOI":"10.24963\/ijcai.2021\/639"},{"key":"406_CR127","doi-asserted-by":"publisher","DOI":"10.1016\/j.bdr.2023.100380","volume":"32","author":"J Peng","year":"2023","unstructured":"Peng J, Hu X, Huang W, Yang J (2023) What is a multi-modal knowledge graph: A survey. Big Data Research 32:100380","journal-title":"Big Data Research"}],"container-title":["International Journal of Multimedia Information Retrieval"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13735-026-00406-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s13735-026-00406-x","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13735-026-00406-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,19]],"date-time":"2026-05-19T16:22:56Z","timestamp":1779207776000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s13735-026-00406-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,5,19]]},"references-count":127,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,6]]}},"alternative-id":["406"],"URL":"https:\/\/doi.org\/10.1007\/s13735-026-00406-x","relation":{},"ISSN":["2192-6611","2192-662X"],"issn-type":[{"value":"2192-6611","type":"print"},{"value":"2192-662X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,5,19]]},"assertion":[{"value":"24 October 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 April 2026","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 May 2026","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 May 2026","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflicts of Interest"}},{"value":"The authors declare no competing interests.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"12"}}