{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T14:56:11Z","timestamp":1781535371612,"version":"3.54.5"},"publisher-location":"New York, NY, USA","reference-count":45,"publisher":"ACM","license":[{"start":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T00:00:00Z","timestamp":1781481600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,6,16]]},"DOI":"10.1145\/3805622.3810663","type":"proceedings-article","created":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T14:42:57Z","timestamp":1781534577000},"page":"347-355","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Global-Regional Dual Hashing for Unsupervised Visual-Textual Retrieval via Concept Similarity Guidance"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8406-0606","authenticated-orcid":false,"given":"Yewen","family":"Li","sequence":"first","affiliation":[{"name":"College of Computer Science and Technology, National University of Defense Technology, Changsha, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-5128-5070","authenticated-orcid":false,"given":"Zongwei","family":"Tang","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, National University of Defense Technology, Changsha, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8949-5967","authenticated-orcid":false,"given":"Xiaodong","family":"Wang","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, National University of Defense Technology, Changsha, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2026,6,15]]},"reference":[{"key":"e_1_3_3_1_2_2","doi-asserted-by":"crossref","unstructured":"Hangbo Bao Wenhui Wang Li Dong Qiang Liu Owais\u00a0Khan Mohammed Kriti Aggarwal Subhojit Som Songhao Piao and Furu Wei. 2022. Vlmo: Unified vision-language pre-training with mixture-of-modality-experts. Advances in Neural Information Processing Systems 35 (2022) 32897\u201332912.","DOI":"10.52202\/068431-2384"},{"key":"e_1_3_3_1_3_2","volume-title":"ICLR","author":"Chen Guangyi","year":"2023","unstructured":"Guangyi Chen, Weiran Yao, Xiangchen Song, Xinyue Li, Yongming Rao, and Kun Zhang. 2023. PLOT: Prompt Learning with Optimal Transport for Vision-Language Models. In ICLR."},{"key":"e_1_3_3_1_4_2","doi-asserted-by":"publisher","DOI":"10.1145\/3485447.3511968"},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"publisher","DOI":"10.1145\/1646396.1646452"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"crossref","unstructured":"Jinrong Cui Zhipeng He Qiong Huang Yulu Fu Yuting Li and Jie Wen. 2024. Structure-aware contrastive hashing for unsupervised cross-modal retrieval. Neural Networks (2024) 106211.","DOI":"10.1016\/j.neunet.2024.106211"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v39i3.32290"},{"key":"e_1_3_3_1_8_2","doi-asserted-by":"crossref","unstructured":"Lunke Fei Zhihao He Wai\u00a0Keung Wong Qi Zhu Shuping Zhao and Jie Wen. 2025. Semantic decomposition and enhancement hashing for deep cross-modal retrieval. Pattern Recognition 160 (2025) 111225.","DOI":"10.1016\/j.patcog.2024.111225"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00319"},{"key":"e_1_3_3_1_10_2","unstructured":"Zhikai Hu Yiu-ming Cheung Mengke Li and Weichao Lan. 2024. Cross-modal hashing method with properties of hamming space: A new perspective. IEEE Transactions on Pattern Analysis and Machine Intelligence (2024)."},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"publisher","DOI":"10.1145\/1460096.1460104"},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"crossref","unstructured":"Yadong Huo Qibing Qin Jiangyan Dai Lei Wang Wenfeng Zhang Lei Huang and Chengduan Wang. 2023. Deep semantic-aware proxy hashing for multi-label cross-modal retrieval. IEEE Transactions on Circuits and Systems for Video Technology 34 1 (2023) 576\u2013589.","DOI":"10.1109\/TCSVT.2023.3285266"},{"key":"e_1_3_3_1_13_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.348"},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"crossref","unstructured":"Salman Khan Muzammal Naseer Munawar Hayat Syed\u00a0Waqas Zamir Fahad\u00a0Shahbaz Khan and Mubarak Shah. 2022. Transformers in vision: A survey. ACM computing surveys (CSUR) 54 10s (2022) 1\u201341.","DOI":"10.1145\/3505244"},{"key":"e_1_3_3_1_15_2","first-page":"5583","volume-title":"International conference on machine learning","author":"Kim Wonjae","year":"2021","unstructured":"Wonjae Kim, Bokyung Son, and Ildoo Kim. 2021. Vilt: Vision-and-language transformer without convolution or region supervision. In International conference on machine learning. PMLR, 5583\u20135594."},{"key":"e_1_3_3_1_16_2","doi-asserted-by":"publisher","DOI":"10.1145\/3591106.3592283"},{"key":"e_1_3_3_1_17_2","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3681112"},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"publisher","DOI":"10.1145\/3397271.3401086"},{"key":"e_1_3_3_1_19_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01029"},{"key":"e_1_3_3_1_20_2","unstructured":"Qibing Qin Lei Wu Wenfeng Zhang Lei Huang and Jie Nie. 2025. Deep Semantic-consistent Penalizing Hashing for Cross-modal Retrieval. IEEE Transactions on Multimedia (2025)."},{"key":"e_1_3_3_1_21_2","first-page":"8748","volume-title":"International conference on machine learning","author":"Radford Alec","year":"2021","unstructured":"Alec Radford, Jong\u00a0Wook Kim, Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell, Pamela Mishkin, Jack Clark, et\u00a0al. 2021. Learning transferable visual models from natural language supervision. In International conference on machine learning. PmLR, 8748\u20138763."},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"crossref","unstructured":"Enrico\u00a0De Santis Alessio Martino Francesca Ronci and Antonello Rizzi. 2025. From Bag-of-Words to Transformers: A Comparative Study for Text Classification in Healthcare Discussions in Social Media. IEEE Transactions on Emerging Topics in Computational Intelligence (2025) 1063\u20131077. Issue 1.","DOI":"10.1109\/TETCI.2024.3423444"},{"key":"e_1_3_3_1_23_2","unstructured":"Xiaobo Shen Yinfan Chen Weiwei Liu Yuhui Zheng Quan-Sen Sun and Shirui Pan. 2024. Graph convolutional multi-label hashing for cross-modal retrieval. IEEE Transactions on Neural Networks and Learning Systems (2024)."},{"key":"e_1_3_3_1_24_2","doi-asserted-by":"crossref","unstructured":"Yufeng Shi Yue Zhao Xin Liu and et\u00a0al. Zheng. 2022. Deep adaptively-enhanced hashing with discriminative similarity guidance for unsupervised cross-modal retrieval. IEEE Transactions on Circuits and Systems for Video Technology 32 10 (2022) 7255\u20137268.","DOI":"10.1109\/TCSVT.2022.3172716"},{"key":"e_1_3_3_1_25_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00312"},{"key":"e_1_3_3_1_26_2","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3680633"},{"key":"e_1_3_3_1_27_2","doi-asserted-by":"publisher","DOI":"10.1145\/3477495.3531947"},{"key":"e_1_3_3_1_28_2","unstructured":"Junfeng Tu Xueliang Liu Yanbin Hao Richang Hong and Meng Wang. 2024. Two-step discrete hashing for cross-modal retrieval. IEEE Transactions on Multimedia (2024)."},{"key":"e_1_3_3_1_29_2","unstructured":"Junfeng Tu Xueliang Liu Zhen Huang Yanbin Hao Richang Hong and Meng Wang. 2025. Cross-Modal Hashing via Diverse Instances Matching. IEEE Transactions on Image Processing (2025)."},{"key":"e_1_3_3_1_30_2","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3548187"},{"key":"e_1_3_3_1_31_2","unstructured":"Rong-Cheng Tu Jie Jiang Qinghong Lin Chengfei Cai Shangxuan Tian Hongfa Wang and Wei Liu. 2023. Unsupervised Cross-modal Hashing with Modality-interaction. IEEE Transactions on Circuits and Systems for Video Technology (2023)."},{"key":"e_1_3_3_1_32_2","unstructured":"Rong-Cheng Tu Xian-Ling Mao Qinghong Lin Wenjin Ji Weize Qin Wei Wei and Heyan Huang. 2023. Unsupervised Cross-modal Hashing via Semantic Text Mining. IEEE Transactions on Multimedia (2023) 1\u201312."},{"key":"e_1_3_3_1_33_2","doi-asserted-by":"crossref","unstructured":"Di Wang Jiabo Tian Xiao Liang Yumin Tian and Lihuo He. 2025. Global-aware Fragment Representation Aggregation Network for image\u2013text retrieval. Pattern Recognition 159 (2025) 111085.","DOI":"10.1016\/j.patcog.2024.111085"},{"key":"e_1_3_3_1_34_2","doi-asserted-by":"crossref","unstructured":"Rukai Wei Yu Liu Heng Cui and et\u00a0al. Yanzhao\u00a0Xie. 2025. Graph Contrastive-and-Reconstructive Hashing for Unsupervised Cross-Modal Retrieval. Data Science and Engineering (2025) 411\u2013427. Issue 3.","DOI":"10.1007\/s41019-025-00282-1"},{"key":"e_1_3_3_1_35_2","unstructured":"Dongqing Wu Huihui Li Cang Gu Lei Guo and Hang Liu. 2024. Dual Stream Relation Learning Network for Image-Text Retrieval. IEEE Transactions on Multimedia (2024)."},{"key":"e_1_3_3_1_36_2","doi-asserted-by":"publisher","DOI":"10.1145\/3511808.3557265"},{"key":"e_1_3_3_1_37_2","unstructured":"Qingpeng Wu Zheng Zhang Yishu Liu Jingyi Zhang and Liqiang Nie. 2024. Contrastive Multi-Bit Collaborative Learning for Deep Cross-Modal Hashing. IEEE Transactions on Knowledge and Data Engineering (2024)."},{"key":"e_1_3_3_1_38_2","doi-asserted-by":"publisher","DOI":"10.1145\/3372278.3390673"},{"key":"e_1_3_3_1_39_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i5.16592"},{"key":"e_1_3_3_1_40_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01100"},{"key":"e_1_3_3_1_41_2","doi-asserted-by":"crossref","unstructured":"Peng-Fei Zhang Yang Li Zi Huang and Xin-Shun Xu. 2022. Aggregation-Based Graph Convolutional Hashing for Unsupervised Cross-Modal Retrieval. IEEE Transactions on Multimedia 24 (2022) 466\u2013479.","DOI":"10.1109\/TMM.2021.3053766"},{"key":"e_1_3_3_1_42_2","doi-asserted-by":"crossref","unstructured":"Yan Zhang Zhong Ji Yanwei Pang and Jungong Han. 2025. Hierarchical and complementary experts transformer with momentum invariance for image-text retrieval. Knowledge-Based Systems 309 (2025) 112912.","DOI":"10.1016\/j.knosys.2024.112912"},{"key":"e_1_3_3_1_43_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01631"},{"key":"e_1_3_3_1_44_2","doi-asserted-by":"crossref","unstructured":"Kaiyang Zhou Jingkang Yang Chen\u00a0Change Loy and Ziwei Liu. 2022. Learning to prompt for vision-language models. International Journal of Computer Vision 130 9 (2022) 2337\u20132348.","DOI":"10.1007\/s11263-022-01653-1"},{"key":"e_1_3_3_1_45_2","doi-asserted-by":"crossref","unstructured":"Lei Zhu Runbing Wu Xinghui Zhu Chengyuan Zhang Lin Wu Shichao Zhang and Xuelong Li. 2024. Bi-Direction Label-Guided Semantic Enhancement for Cross-Modal Hashing. IEEE Transactions on Circuits and Systems for Video Technology (2024).","DOI":"10.1109\/TCSVT.2024.3521646"},{"key":"e_1_3_3_1_46_2","doi-asserted-by":"crossref","unstructured":"Lei Zhu Xize Wu Jingjing Li Zheng Zhang Weili Guan and Heng\u00a0Tao Shen. 2023. Work Together: Correlation-Identity Reconstruction Hashing for Unsupervised Cross-Modal Retrieval. IEEE Transactions on Knowledge and Data Engineering (2023) 8838\u20138851. Issue 9.","DOI":"10.1109\/TKDE.2022.3218656"}],"event":{"name":"ICMR '26: International Conference on Multimedia Retrieval","location":"Amsterdam The Netherlands","acronym":"ICMR '26","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 2026 International Conference on Multimedia Retrieval"],"original-title":[],"deposited":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T14:48:51Z","timestamp":1781534931000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3805622.3810663"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6,15]]},"references-count":45,"alternative-id":["10.1145\/3805622.3810663","10.1145\/3805622"],"URL":"https:\/\/doi.org\/10.1145\/3805622.3810663","relation":{},"subject":[],"published":{"date-parts":[[2026,6,15]]},"assertion":[{"value":"2026-06-15","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}