{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T15:56:51Z","timestamp":1781539011180,"version":"3.54.5"},"publisher-location":"New York, NY, USA","reference-count":45,"publisher":"ACM","license":[{"start":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T00:00:00Z","timestamp":1781481600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"name":"Major Projects of the Educational Sciences Plan of Beijing Municipality","award":["AMAA25002"],"award-info":[{"award-number":["AMAA25002"]}]},{"name":"Beijing Natural Science Foundation","award":["QY25393"],"award-info":[{"award-number":["QY25393"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,6,16]]},"DOI":"10.1145\/3805622.3810820","type":"proceedings-article","created":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T14:42:57Z","timestamp":1781534577000},"page":"147-156","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["LSR\u00b2: Learning to Select Relational and Reasoning Feature for Multi-modal Re-identification"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0004-6879-9135","authenticated-orcid":false,"given":"Peng","family":"Jin","sequence":"first","affiliation":[{"name":"Capital Normal University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1573-8919","authenticated-orcid":false,"given":"Yuxuan","family":"Qiu","sequence":"additional","affiliation":[{"name":"Capital Normal University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-9632-0271","authenticated-orcid":false,"given":"Zhaofa","family":"Wang","sequence":"additional","affiliation":[{"name":"Capital Normal University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-7433-1839","authenticated-orcid":false,"given":"Xiaoyue","family":"Hu","sequence":"additional","affiliation":[{"name":"Capital Normal University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6497-8118","authenticated-orcid":false,"given":"Xiabing","family":"Zhou","sequence":"additional","affiliation":[{"name":"Capital Normal University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2239-1121","authenticated-orcid":false,"given":"Na","family":"Jiang","sequence":"additional","affiliation":[{"name":"Capital Normal University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2026,6,15]]},"reference":[{"key":"e_1_3_3_1_2_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02534"},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01449"},{"key":"e_1_3_3_1_4_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01027"},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"publisher","unstructured":"Wenjiao Dong Xi Yang De Cheng Nannan Wang and Xinbo Gao. 2025. Escaping Modal Interactions: An Efficient DESANet for Multi-Modal Object Re-Identification. IEEE Trans. Image Process. 34 (2025) 5068\u20135083. 10.1109\/TIP.2025.3592575","DOI":"10.1109\/TIP.2025.3592575"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01035"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","unstructured":"Yingying Feng Jie Li Jie Hu Yukang Zhang Lei Tan and Jiayi Ji. 2025. MDReID: Modality-Decoupled Learning for Any-to-Any Multi-Modal Object Re-Identification. CoRR abs\/2510.23301 (2025). arXiv:https:\/\/arXiv.org\/abs\/2510.2330110.48550\/ARXIV.2510.23301","DOI":"10.48550\/ARXIV.2510.23301"},{"key":"e_1_3_3_1_8_2","series-title":"Proceedings of Machine Learning Research","volume-title":"Forty-second International Conference on Machine Learning, ICML 2025, Vancouver, BC, Canada, July 13-19, 2025","volume":"267","author":"Feng Yingying","year":"2025","unstructured":"Yingying Feng, Jie Li, Chi Xie, Lei Tan, and Jiayi Ji. 2025. Multi-Modal Object Re-identification via Sparse Mixture-of-Experts. In Forty-second International Conference on Machine Learning, ICML 2025, Vancouver, BC, Canada, July 13-19, 2025(Proceedings of Machine Learning Research, Vol.\u00a0267), Aarti Singh, Maryam Fazel, Daniel Hsu, Simon Lacoste-Julien, Felix Berkenkamp, Tegan Maharaj, Kiri Wagstaff, and Jerry Zhu (Eds.). PMLR \/ OpenReview.net. https:\/\/proceedings.mlr.press\/v267\/feng25i.html"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICSP54964.2022.9778769"},{"key":"e_1_3_3_1_10_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICSP58490.2023.10248672"},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"publisher","unstructured":"Robert\u00a0A. Jacobs Michael\u00a0I. Jordan Steven\u00a0J. Nowlan and Geoffrey\u00a0E. Hinton. 1991. Adaptive Mixtures of Local Experts. Neural Comput. 3 1 (1991) 79\u201387. 10.1162\/NECO.1991.3.1.79","DOI":"10.1162\/NECO.1991.3.1.79"},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00273"},{"key":"e_1_3_3_1_13_2","doi-asserted-by":"publisher","DOI":"10.1609\/AAAI.V34I07.6796"},{"key":"e_1_3_3_1_14_2","unstructured":"Shihao Li Aihua Zheng Andong Lu Jin Tang and Jixin Ma. 2025. NEXT: Multi-Grained Mixture of Experts via Text-Modulation for Multi-Modal Object Re-Identification. arxiv:https:\/\/arXiv.org\/abs\/2505.20001\u00a0[cs.CV] https:\/\/arxiv.org\/abs\/2505.20001"},{"key":"e_1_3_3_1_15_2","first-page":"1047","volume-title":"Proceedings of the Thirty-Third International Joint Conference on Artificial Intelligence, IJCAI 2024, Jeju, South Korea, August 3-9, 2024","author":"Li Zongyi","year":"2024","unstructured":"Zongyi Li, Jianbo Li, Yuxuan Shi, Hefei Ling, Jiazhong Chen, Runsheng Wang, and Shijuan Huang. 2024. Cross-modal Generation and Alignment via Attribute-guided Prompt for Unsupervised Text-based Person Retrieval. In Proceedings of the Thirty-Third International Joint Conference on Artificial Intelligence, IJCAI 2024, Jeju, South Korea, August 3-9, 2024. ijcai.org, 1047\u20131055. https:\/\/www.ijcai.org\/proceedings\/2024\/116"},{"key":"e_1_3_3_1_16_2","volume-title":"Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022","author":"Liang Weixin","year":"2022","unstructured":"Weixin Liang, Yuhui Zhang, Yongchan Kwon, Serena Yeung, and James\u00a0Y. Zou. 2022. Mind the Gap: Understanding the Modality Gap in Multi-modal Contrastive Representation Learning. In Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022, Sanmi Koyejo, S.\u00a0Mohamed, A.\u00a0Agarwal, Danielle Belgrave, K.\u00a0Cho, and A.\u00a0Oh (Eds.). http:\/\/papers.nips.cc\/paper_files\/paper\/2022\/hash\/702f4db7543a7432431df588d57bc7c9-Abstract-Conference.html"},{"key":"e_1_3_3_1_17_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i2.25273"},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00063"},{"key":"e_1_3_3_1_19_2","unstructured":"Alec Radford Jong\u00a0Wook Kim Chris Hallacy Aditya Ramesh Gabriel Goh Sandhini Agarwal Girish Sastry Amanda Askell Pamela Mishkin Jack Clark Gretchen Krueger and Ilya Sutskever. 2021. Learning Transferable Visual Models From Natural Language Supervision. arxiv:https:\/\/arXiv.org\/abs\/2103.00020\u00a0[cs.CV] https:\/\/arxiv.org\/abs\/2103.00020"},{"key":"e_1_3_3_1_20_2","volume-title":"5th International Conference on Learning Representations, ICLR 2017, Toulon, France, April 24-26, 2017, Conference Track Proceedings","author":"Shazeer Noam","year":"2017","unstructured":"Noam Shazeer, Azalia Mirhoseini, Krzysztof Maziarz, Andy Davis, Quoc\u00a0V. Le, Geoffrey\u00a0E. Hinton, and Jeff Dean. 2017. Outrageously Large Neural Networks: The Sparsely-Gated Mixture-of-Experts Layer. In 5th International Conference on Learning Representations, ICLR 2017, Toulon, France, April 24-26, 2017, Conference Track Proceedings. OpenReview.net. https:\/\/openreview.net\/forum?id=B1ckMDqlg"},{"key":"e_1_3_3_1_21_2","doi-asserted-by":"publisher","DOI":"10.18653\/V1\/2023.FINDINGS-EMNLP.758"},{"key":"e_1_3_3_1_22_2","volume-title":"NeurIPS","author":"Shi Jiangming","year":"2024","unstructured":"Jiangming Shi, Xiangbo Yin, Yachao Zhang, Zhizhong Zhang, Yuan Xie, and Yanyun Qu. 2024. Learning Commonality, Divergence and Variety for Unsupervised Visible-Infrared Person Re-identification. In NeurIPS."},{"key":"e_1_3_3_1_23_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01030"},{"key":"e_1_3_3_1_24_2","unstructured":"Vishaal Udandarao Abhishek Maiti Deepak Srivatsav Suryatej\u00a0Reddy Vyalla Yifang Yin and Rajiv\u00a0Ratn Shah. 2020. COBRA: Contrastive Bi-Modal Representation Algorithm. CoRR abs\/2005.03687 (2020). arXiv:https:\/\/arXiv.org\/abs\/2005.03687https:\/\/arxiv.org\/abs\/2005.03687"},{"key":"e_1_3_3_1_25_2","doi-asserted-by":"publisher","unstructured":"Xixi Wan Aihua Zheng Zi Wang Bo Jiang Jin Tang and Jixin Ma. 2025. Reliable Multi-Modal Object Re-Identification via Modality-Aware Graph Reasoning. CoRR abs\/2504.14847 (2025). arXiv:https:\/\/arXiv.org\/abs\/2504.1484710.48550\/ARXIV.2504.14847","DOI":"10.48550\/ARXIV.2504.14847"},{"key":"e_1_3_3_1_26_2","doi-asserted-by":"publisher","DOI":"10.1145\/3240508.3240552"},{"key":"e_1_3_3_1_27_2","series-title":"Proceedings of Machine Learning Research","first-page":"552","volume-title":"Proceedings of the Thirty-Fifth Conference on Uncertainty in Artificial Intelligence, UAI 2019, Tel Aviv, Israel, July 22-25, 2019","volume":"115","author":"Wang Xin","year":"2019","unstructured":"Xin Wang, Fisher Yu, Lisa Dunlap, Yi-An Ma, Ruth Wang, Azalia Mirhoseini, Trevor Darrell, and Joseph\u00a0E. Gonzalez. 2019. Deep Mixture of Experts via Shallow Embedding. In Proceedings of the Thirty-Fifth Conference on Uncertainty in Artificial Intelligence, UAI 2019, Tel Aviv, Israel, July 22-25, 2019(Proceedings of Machine Learning Research, Vol.\u00a0115), Amir Globerson and Ricardo Silva (Eds.). AUAI Press, 552\u2013562. http:\/\/proceedings.mlr.press\/v115\/wang20d.html"},{"key":"e_1_3_3_1_28_2","doi-asserted-by":"publisher","DOI":"10.1609\/AAAI.V39I8.32879"},{"key":"e_1_3_3_1_29_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i6.28388"},{"key":"e_1_3_3_1_30_2","doi-asserted-by":"publisher","DOI":"10.1609\/AAAI.V39I8.32878"},{"key":"e_1_3_3_1_31_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.02765"},{"key":"e_1_3_3_1_32_2","doi-asserted-by":"publisher","DOI":"10.1609\/AAAI.V36I3.20165"},{"key":"e_1_3_3_1_33_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00071"},{"key":"e_1_3_3_1_34_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.575"},{"key":"e_1_3_3_1_35_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01021"},{"key":"e_1_3_3_1_36_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01596"},{"key":"e_1_3_3_1_37_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00692"},{"key":"e_1_3_3_1_38_2","doi-asserted-by":"publisher","unstructured":"Tianyu Zang Yunrui Guo Pan Wang Yuwei Gao and Yuan Zhou. 2025. Enhancing cross-modal person reidentification: multi-scale feature alignment and optimization. The Visual Computer 42 1 (Dec. 2025). 10.1007\/s00371-025-04231-x","DOI":"10.1007\/s00371-025-04231-x"},{"key":"e_1_3_3_1_39_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i7.28524"},{"key":"e_1_3_3_1_40_2","doi-asserted-by":"publisher","unstructured":"Chao Zhang Weifeng Zhong Changfeng Li and Haipeng Deng. 2023. Random walk-based erasing data augmentation for deep learning. Signal Image Video Process. 17 5 (2023) 2447\u20132454. 10.1007\/S11760-022-02461-3","DOI":"10.1007\/S11760-022-02461-3"},{"key":"e_1_3_3_1_41_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01620"},{"key":"e_1_3_3_1_42_2","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3613757"},{"key":"e_1_3_3_1_43_2","doi-asserted-by":"publisher","unstructured":"Aihua Zheng Zhiqi Ma Yongqi Sun Zi Wang Chenglong Li and Jin Tang. 2025. Flare-aware cross-modal enhancement network for multi-spectral vehicle Re-identification. Inf. Fusion 116 (2025) 102800. 10.1016\/J.INFFUS.2024.102800","DOI":"10.1016\/J.INFFUS.2024.102800"},{"key":"e_1_3_3_1_44_2","doi-asserted-by":"publisher","DOI":"10.1609\/AAAI.V35I4.16467"},{"key":"e_1_3_3_1_45_2","doi-asserted-by":"publisher","unstructured":"Aihua Zheng Xianpeng Zhu Zhiqi Ma Chenglong Li Jin Tang and Jixin Ma. 2023. Cross-directional consistency network with adaptive layer normalization for multi-spectral vehicle re-identification and a high-quality benchmark. Inf. Fusion 100 (2023) 101901. 10.1016\/J.INFFUS.2023.101901","DOI":"10.1016\/J.INFFUS.2023.101901"},{"key":"e_1_3_3_1_46_2","doi-asserted-by":"publisher","unstructured":"Yuanxin Zhu Zhao Yang Li Wang Sai Zhao Xiao Hu and Dapeng Tao. 2020. Hetero-Center loss for cross-modality person Re-identification. Neurocomputing 386 (2020) 97\u2013109. 10.1016\/J.NEUCOM.2019.12.100","DOI":"10.1016\/J.NEUCOM.2019.12.100"}],"event":{"name":"ICMR '26: International Conference on Multimedia Retrieval","location":"Amsterdam The Netherlands","acronym":"ICMR '26","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 2026 International Conference on Multimedia Retrieval"],"original-title":[],"deposited":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T15:26:38Z","timestamp":1781537198000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3805622.3810820"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6,15]]},"references-count":45,"alternative-id":["10.1145\/3805622.3810820","10.1145\/3805622"],"URL":"https:\/\/doi.org\/10.1145\/3805622.3810820","relation":{},"subject":[],"published":{"date-parts":[[2026,6,15]]},"assertion":[{"value":"2026-06-15","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}