{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T17:08:53Z","timestamp":1777655333741,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":71,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,7,13]]},"DOI":"10.1145\/3726302.3729906","type":"proceedings-article","created":{"date-parts":[[2025,7,14]],"date-time":"2025-07-14T01:18:36Z","timestamp":1752455916000},"page":"989-999","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["Boosting Discriminability for Robust Multimodal Entity Linking with Visual Modality Missing"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8413-7220","authenticated-orcid":false,"given":"Mingrui","family":"Lao","sequence":"first","affiliation":[{"name":"National Key Laboratory of Information Systems Engineering, NUDT, Changsha, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-8789-7413","authenticated-orcid":false,"given":"Zheng","family":"Li","sequence":"additional","affiliation":[{"name":"Laboratory for Big Data and Decision, NUDT, Changsha, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9184-5313","authenticated-orcid":false,"given":"Yanming","family":"Guo","sequence":"additional","affiliation":[{"name":"Laboratory for Big Data and Decision, NUDT, Changsha, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-2861-633X","authenticated-orcid":false,"given":"Xueyi","family":"Zhang","sequence":"additional","affiliation":[{"name":"Laboratory for Big Data and Decision, NUDT, Changsha, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8012-6820","authenticated-orcid":false,"given":"Siqi","family":"Cai","sequence":"additional","affiliation":[{"name":"National University of Singapore, Singapore, Singapore"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3657-292X","authenticated-orcid":false,"given":"Zhaoyun","family":"Ding","sequence":"additional","affiliation":[{"name":"National Key Laboratory of Information Systems Engineering, NUDT, Changsha, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9158-9401","authenticated-orcid":false,"given":"Haizhou","family":"Li","sequence":"additional","affiliation":[{"name":"The Chinese University of Hong Kong, Shenzhen, Shenzhen, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,7,13]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Herv\u00e9 Le Borgne, and Brigitte Grau","author":"Adjali Omar","year":"2020","unstructured":"Omar Adjali, Romaric Besan\u00e7on, Olivier Ferret, Herv\u00e9 Le Borgne, and Brigitte Grau. 2020. Building a multimodal entity linking dataset from tweets. In Proceed- ings of the Twelfth Language Resources and Evaluation Conference. 4285-4292."},{"key":"e_1_3_2_1_2_1","article-title":"The question answering systems: A survey","volume":"2","author":"Nabil Allam Ali Mohamed","year":"2012","unstructured":"Ali Mohamed Nabil Allam and Mohamed Hassan Haggag. 2012. The question answering systems: A survey. International Journal of Research and Reviews in Information Sciences (IJRRIS) 2, 3 (2012).","journal-title":"International Journal of Research and Reviews in Information Sciences (IJRRIS)"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.279"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/792548.611918"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/3626772.3658596"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW63382.2024.00127"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/2684822.2685317"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3219963"},{"key":"e_1_3_2_1_9_1","volume-title":"Mario Valerio Giuffrida, and Sotirios A Tsaf- taris","author":"Chartsias Agisilaos","year":"2017","unstructured":"Agisilaos Chartsias, Thomas Joyce, Mario Valerio Giuffrida, and Sotirios A Tsaf- taris. 2017. Multimodal MR synthesis via modality-invariant latent representation. IEEE transactions on medical imaging 37, 3 (2017), 803-814."},{"key":"e_1_3_2_1_10_1","volume-title":"Learning with privileged multimodal knowledge for unimodal segmentation","author":"Chen Cheng","year":"2021","unstructured":"Cheng Chen, Qi Dou, Yueming Jin, Quande Liu, and Pheng Ann Heng. 2021. Learning with privileged multimodal knowledge for unimodal segmentation. IEEE transactions on medical imaging 41, 3 (2021), 621-632."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/3166054.3166058"},{"key":"e_1_3_2_1_12_1","first-page":"36218","article-title":"Probabilistic Conformal Distillation for Enhancing Missing Modality Robustness","volume":"37","author":"Chen Mengxi","year":"2024","unstructured":"Mengxi Chen, Fei Zhang, Zihua Zhao, Jiangchao Yao, Ya Zhang, and Yanfeng Wang. 2024. Probabilistic Conformal Distillation for Enhancing Missing Modality Robustness. Advances in Neural Information Processing Systems 37 (2024), 36218- 36242.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_13_1","volume-title":"Disentangle first, then distill: A unified framework for missing modality imputation and Alzheimer's disease diagnosis","author":"Chen Yuanyuan","year":"2023","unstructured":"Yuanyuan Chen, Yongsheng Pan, Yong Xia, and Yixuan Yuan. 2023. Disentangle first, then distill: A unified framework for missing modality imputation and Alzheimer's disease diagnosis. IEEE Transactions on Medical Imaging (2023)."},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.121"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.findings-emnlp.230"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2022.09.025"},{"key":"e_1_3_2_1_17_1","volume-title":"Conference on Empirical Methods in Natural Language Processing. https:\/\/api.semanticscholar.org\/CorpusID:1356505","author":"Ganea Octavian-Eugen","year":"2017","unstructured":"Octavian-Eugen Ganea and Thomas Hofmann. 2017. Deep Joint Entity Disam- biguation with Local Neural Attention. In Conference on Empirical Methods in Natural Language Processing. https:\/\/api.semanticscholar.org\/CorpusID:1356505"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/3640457.3688138"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ipm.2019.102067"},{"key":"e_1_3_2_1_20_1","volume-title":"Proceedings of the 2017 conference on empirical methods in natural language processing. 2681-2690","author":"Gupta Nitish","year":"2017","unstructured":"Nitish Gupta, Sameer Singh, and Dan Roth. 2017. Entity linking via joint encod- ing of types, descriptions, and context. In Proceedings of the 2017 conference on empirical methods in natural language processing. 2681-2690."},{"key":"e_1_3_2_1_21_1","first-page":"33716","article-title":"Knowledge distillation from a stronger teacher","volume":"35","author":"Huang Tao","year":"2022","unstructured":"Tao Huang, Shan You, Fei Wang, Chen Qian, and Chang Xu. 2022. Knowledge distillation from a stronger teacher. Advances in Neural Information Processing Systems 35 (2022), 33716-33727.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01100"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3612291"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00650"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/3474085.3475492"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2020.10.071"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i11.26527"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3612121"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01435"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2023.102869"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2020.105592"},{"key":"e_1_3_2_1_32_1","volume-title":"Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 12458-12468","author":"Li Mingcheng","year":"2024","unstructured":"Mingcheng Li, Dingkang Yang, Xiao Zhao, Shuaibing Wang, Yan Wang, Kun Yang, Mingyang Sun, Dongliang Kou, Ziyun Qian, and Lihua Zhang. 2024. Correlation- Decoupled Knowledge Distillation for Multimodal Sentiment Analysis with In- complete Modalities. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 12458-12468."},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2020.3046855"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2023.101973"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3681661"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1145\/3580305.3599439"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/3627673.3679898"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMI.2024.3368664"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1186"},{"key":"e_1_3_2_1_40_1","volume-title":"Learning Trimodal Relation for Audio-Visual Question Answering with Missing Modality. In European Conference on Computer Vision. Springer, 42-59","author":"Park Kyu Ri","year":"2025","unstructured":"Kyu Ri Park, Hong Joo Lee, and Jung Uk Kim. 2025. Learning Trimodal Relation for Audio-Visual Question Answering with Missing Modality. In European Conference on Computer Vision. Springer, 42-59."},{"key":"e_1_3_2_1_41_1","volume-title":"ICASSP 2024-2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). IEEE, 5755-5759","author":"Park Kyu Ri","year":"2024","unstructured":"Kyu Ri Park, Youngmin Oh, and Jung Uk Kim. 2024. Enhancing Audio-Visual Question Answering with Missing Modality via Trans-Modal Associative Learn- ing. In ICASSP 2024-2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). IEEE, 5755-5759."},{"key":"e_1_3_2_1_42_1","volume-title":"International conference on machine learning. PMLR, 8748-8763","author":"Radford Alec","year":"2021","unstructured":"Alec Radford, Jong Wook Kim, Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell, Pamela Mishkin, Jack Clark, et al. 2021. Learning transferable visual models from natural language supervision. In International conference on machine learning. PMLR, 8748-8763."},{"key":"e_1_3_2_1_43_1","first-page":"73","article-title":"An overview of semantic search engines","volume":"6","author":"Roy Subham","year":"2019","unstructured":"Subham Roy, Akshay Modak, Debabrata Barik, and Surajit Goon. 2019. An overview of semantic search engines. Int. J. Res. Rev 6, 10 (2019), 73-85.","journal-title":"Int. J. Res. Rev"},{"key":"e_1_3_2_1_44_1","first-page":"2556","article-title":"Entity linking meets deep learning: Techniques and solutions","volume":"35","author":"Shen Wei","year":"2021","unstructured":"Wei Shen, Yuhan Li, Yinan Liu, Jiawei Han, Jianyong Wang, and Xiaojie Yuan. 2021. Entity linking meets deep learning: Techniques and solutions. IEEE Trans- actions on Knowledge and Data Engineering 35, 3 (2021), 2556-2578.","journal-title":"IEEE Trans- actions on Knowledge and Data Engineering"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2014.2327028"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i17.29867"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-acl.46"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01489"},{"key":"e_1_3_2_1_49_1","unstructured":"Yaming Sun Lei Lin Duyu Tang Nan Yang Zhenzhou Ji and Xiaolong Wang. 2015. Modeling mention context and entity with neural networks for entity disambiguation. In Twenty-fourth international joint conference on artificial intel- ligence."},{"key":"e_1_3_2_1_50_1","volume-title":"Any-to-any generation via composable diffusion. Advances in Neural Information Processing Systems 36","author":"Tang Zineng","year":"2024","unstructured":"Zineng Tang, Ziyi Yang, Chenguang Zhu, Michael Zeng, and Mohit Bansal. 2024. Any-to-any generation via composable diffusion. Advances in Neural Information Processing Systems 36 (2024)."},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ipm.2020.102277"},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.1145\/3711121"},{"key":"e_1_3_2_1_53_1","volume-title":"Proceedings of the IEEE conference on computer vision and pattern recognition. 1405-1414","author":"Tran Luan","year":"2017","unstructured":"Luan Tran, Xiaoming Liu, Jiayu Zhou, and Rong Jin. 2017. Missing modalities im- putation via cascaded residual autoencoder. In Proceedings of the IEEE conference on computer vision and pattern recognition. 1405-1414."},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01524"},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-43901-8_21"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.bdr.2020.100159"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.1145\/3477495.3531867"},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"crossref","unstructured":"Xuwu Wang Junfeng Tian Min Gui Zhixu Li Rui Wang Ming Yan Lihan Chen and Yanghua Xiao. 2022. WikiDiverse: A Multimodal Entity Linking Dataset with Diversified Contextual Topics and Entity Types. In Annual Meeting of the Association for Computational Linguistics. https:\/\/api.semanticscholar.org\/ CorpusID:248157348","DOI":"10.18653\/v1\/2022.acl-long.328"},{"key":"e_1_3_2_1_59_1","volume-title":"Deep multimodal fusion by channel exchanging. Advances in neural information processing systems 33","author":"Wang Yikai","year":"2020","unstructured":"Yikai Wang, Wenbing Huang, Fuchun Sun, Tingyang Xu, Yu Rong, and Junzhou Huang. 2020. Deep multimodal fusion by channel exchanging. Advances in neural information processing systems 33 (2020), 4835-4845."},{"key":"e_1_3_2_1_60_1","first-page":"17117","article-title":"Incomplete multimodality-diffused emotion recognition","volume":"36","author":"Wang Yuanzhi","year":"2023","unstructured":"Yuanzhi Wang, Yong Li, and Zhen Cui. 2023. Incomplete multimodality-diffused emotion recognition. Advances in Neural Information Processing Systems 36 (2023), 17117-17128.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_61_1","volume-title":"International Conference on Machine Learning. PMLR, 10334-10343","author":"Woodworth Blake","year":"2020","unstructured":"Blake Woodworth, Kumar Kshitij Patel, Sebastian Stich, Zhen Dai, Brian Bullins, Brendan Mcmahan, Ohad Shamir, and Nathan Srebro. 2020. Is local SGD better than minibatch SGD?. In International Conference on Machine Learning. PMLR, 10334-10343."},{"key":"e_1_3_2_1_62_1","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3612575"},{"key":"e_1_3_2_1_63_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11704-024-40555-y"},{"key":"e_1_3_2_1_64_1","first-page":"1006","article-title":"Incomplete learning of multi-modal connectome for brain disorder diagnosis via modal-mixup and deep supervision","author":"Yang Yanwu","year":"2024","unstructured":"Yanwu Yang, Hairui Chen, Zhikai Chang, Yang Xiang, Chenfei Ye, and Ting Ma. 2024. Incomplete learning of multi-modal connectome for brain disorder diagnosis via modal-mixup and deep supervision. In Medical Imaging With Deep Learning. PMLR, 1006-1018.","journal-title":"Medical Imaging With Deep Learning. PMLR"},{"key":"e_1_3_2_1_65_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neuroimage.2012.03.059"},{"key":"e_1_3_2_1_66_1","doi-asserted-by":"publisher","DOI":"10.1145\/3477495.3532064"},{"key":"e_1_3_2_1_67_1","doi-asserted-by":"publisher","DOI":"10.1145\/3534678.3539388"},{"key":"e_1_3_2_1_68_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-30675-4_45"},{"key":"e_1_3_2_1_69_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-73197-7_35"},{"key":"e_1_3_2_1_70_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-acl.243"},{"key":"e_1_3_2_1_71_1","volume-title":"Towards un- derstanding convergence and generalization of AdamW","author":"Zhou Pan","year":"2024","unstructured":"Pan Zhou, Xingyu Xie, Zhouchen Lin, and Shuicheng Yan. 2024. Towards un- derstanding convergence and generalization of AdamW. IEEE Transactions on Pattern Analysis and Machine Intelligence (2024)."}],"event":{"name":"SIGIR '25: The 48th International ACM SIGIR Conference on Research and Development in Information Retrieval","location":"Padua Italy","acronym":"SIGIR '25","sponsor":["SIGIR ACM Special Interest Group on Information Retrieval"]},"container-title":["Proceedings of the 48th International ACM SIGIR Conference on Research and Development in Information Retrieval"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3726302.3729906","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T18:29:15Z","timestamp":1755887355000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3726302.3729906"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,13]]},"references-count":71,"alternative-id":["10.1145\/3726302.3729906","10.1145\/3726302"],"URL":"https:\/\/doi.org\/10.1145\/3726302.3729906","relation":{},"subject":[],"published":{"date-parts":[[2025,7,13]]},"assertion":[{"value":"2025-07-13","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}