{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T05:04:24Z","timestamp":1750309464202,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":35,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,12,13]],"date-time":"2024-12-13T00:00:00Z","timestamp":1734048000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,12,13]]},"DOI":"10.1145\/3702250.3702270","type":"proceedings-article","created":{"date-parts":[[2024,12,31]],"date-time":"2024-12-31T12:11:38Z","timestamp":1735647098000},"page":"1-9","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["APMSA: Crossmodal Remote Sensing Image Retrieval using Attention Pooling and Multimodal Semantic Alignment"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4093-1470","authenticated-orcid":false,"given":"Aparna","family":"H","sequence":"first","affiliation":[{"name":"National Institute of Technology Tiruchirappalli, Tiruchirappalli, IN"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2276-3618","authenticated-orcid":false,"given":"Avik","family":"Hati","sequence":"additional","affiliation":[{"name":"NIT Tiruchirappalli, Tiruchirappalli, IN"}]}],"member":"320","published-online":{"date-parts":[[2024,12,31]]},"reference":[{"doi-asserted-by":"crossref","unstructured":"Mohamad\u00a0M Al\u00a0Rahhal Yakoub Bazi Norah\u00a0A Alsharif Laila Bashmal Naif Alajlan and Farid Melgani. 2022. Multilanguage transformer for improved text to remote sensing image retrieval. IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing 15 (2022) 9115\u20139126.","key":"e_1_3_3_1_2_2","DOI":"10.1109\/JSTARS.2022.3215803"},{"doi-asserted-by":"crossref","unstructured":"Ushasi Chaudhuri Biplab Banerjee Avik Bhattacharya and Mihai Datcu. 2020. CMIR-NET: A deep learning based model for cross-modal retrieval in remote sensing. Pattern recognition letters 131 (2020) 456\u2013462.","key":"e_1_3_3_1_3_2","DOI":"10.1016\/j.patrec.2020.02.006"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_4_2","DOI":"10.1109\/IGARSS47720.2021.9554838"},{"doi-asserted-by":"crossref","unstructured":"Qimin Cheng Yuzhuo Zhou Peng Fu Yuan Xu and Liang Zhang. 2021. A deep semantic alignment network for the cross-modal image-text retrieval in remote sensing. IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing 14 (2021) 4284\u20134297.","key":"e_1_3_3_1_5_2","DOI":"10.1109\/JSTARS.2021.3070872"},{"doi-asserted-by":"crossref","unstructured":"Yunchao Gong Svetlana Lazebnik Albert Gordo and Florent Perronnin. 2012. Iterative quantization: A procrustean approach to learning binary codes for large-scale image retrieval. IEEE transactions on pattern analysis and machine intelligence 35 12 (2012) 2916\u20132929.","key":"e_1_3_3_1_6_2","DOI":"10.1109\/TPAMI.2012.193"},{"doi-asserted-by":"crossref","unstructured":"Lirong Han Mercedes\u00a0E Paoletti Xuanwen Tao Zhaoyue Wu Juan\u00a0M Haut Javier Plaza and Antonio Plaza. 2023. Central cohesion gradual hashing for remote sensing image retrieval. IEEE Geoscience and Remote Sensing Letters 20 (2023) 1\u20135.","key":"e_1_3_3_1_7_2","DOI":"10.1109\/LGRS.2023.3241849"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_8_2","DOI":"10.1109\/IGARSS.2018.8519248"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_9_2","DOI":"10.1007\/978-3-319-24261-3_7"},{"doi-asserted-by":"crossref","unstructured":"Dongyang Hou Siyuan Wang Xueqing Tian and Huaqiao Xing. 2022. An attention-enhanced end-to-end discriminative network with multiscale feature learning for remote sensing image retrieval. IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing 15 (2022) 8245\u20138255.","key":"e_1_3_3_1_10_2","DOI":"10.1109\/JSTARS.2022.3208107"},{"doi-asserted-by":"crossref","unstructured":"Mengluan Huang Le Dong Weisheng Dong and Guangming Shi. 2023. Supervised contrastive learning based on fusion of global and local features for remote sensing image retrieval. IEEE Transactions on Geoscience and Remote Sensing 61 (2023) 1\u201313.","key":"e_1_3_3_1_11_2","DOI":"10.1109\/TGRS.2023.3275644"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_12_2","DOI":"10.1109\/CVPR.2017.348"},{"unstructured":"Diederik\u00a0P Kingma and Jimmy Ba. 2015. Adam: A method for stochastic optimization. International Conference on Learning Representations (ICLR).","key":"e_1_3_3_1_13_2"},{"doi-asserted-by":"crossref","unstructured":"Haoran Li Wei Xiong Yaqi Cui and Zhenyu Xiong. 2022. A fusion-based contrastive learning model for cross-modal remote sensing retrieval. International Journal of Remote Sensing 43 9 (2022) 3359\u20133386.","key":"e_1_3_3_1_14_2","DOI":"10.1080\/01431161.2022.2091964"},{"doi-asserted-by":"crossref","unstructured":"Yansheng Li Jiayi Ma and Yongjun Zhang. 2021. Image retrieval from remote sensing big data: A survey. Information Fusion 67 (2021) 94\u2013115.","key":"e_1_3_3_1_15_2","DOI":"10.1016\/j.inffus.2020.10.008"},{"doi-asserted-by":"crossref","unstructured":"Yansheng Li Yongjun Zhang Xin Huang and Jiayi Ma. 2018. Learning source-invariant deep hashing convolutional neural networks for cross-source remote sensing image retrieval. IEEE Transactions on Geoscience and Remote Sensing 56 11 (2018) 6521\u20136536.","key":"e_1_3_3_1_16_2","DOI":"10.1109\/TGRS.2018.2839705"},{"doi-asserted-by":"crossref","unstructured":"Chao Liu Jingjing Ma Xu Tang Fang Liu Xiangrong Zhang and Licheng Jiao. 2020. Deep hash learning for remote sensing image retrieval. IEEE Transactions on Geoscience and Remote Sensing 59 4 (2020) 3420\u20133443.","key":"e_1_3_3_1_17_2","DOI":"10.1109\/TGRS.2020.3007533"},{"doi-asserted-by":"crossref","unstructured":"Yafei Lv Wei Xiong Xiaohan Zhang and Yaqi Cui. 2021. Fusion-based correlation learning model for cross-modal remote sensing image retrieval. IEEE Geoscience and Remote Sensing Letters 19 (2021) 1\u20135.","key":"e_1_3_3_1_18_2","DOI":"10.1109\/LGRS.2021.3131592"},{"key":"e_1_3_3_1_19_2","first-page":"8748","volume-title":"International conference on machine learning","author":"Radford Alec","year":"2021","unstructured":"Alec Radford, Jong\u00a0Wook Kim, Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell, Pamela Mishkin, Jack Clark, et\u00a0al. 2021. Learning transferable visual models from natural language supervision. In International conference on machine learning. PMLR, 8748\u20138763."},{"doi-asserted-by":"crossref","unstructured":"SK Sudha and S Aji. 2019. A review on recent advances in remote sensing image retrieval techniques. Journal of the Indian Society of Remote Sensing 47 12 (2019) 2129\u20132139.","key":"e_1_3_3_1_20_2","DOI":"10.1007\/s12524-019-01049-8"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_21_2","DOI":"10.1109\/ICIP46576.2022.9897475"},{"doi-asserted-by":"crossref","unstructured":"Yuxi Sun Shanshan Feng Yunming Ye Xutao Li Jian Kang Zhichao Huang and Chuyao Luo. 2021. Multisensor fusion and explicit semantic preserving-based deep hashing for cross-modal remote sensing image retrieval. IEEE Transactions on Geoscience and Remote Sensing 60 (2021) 1\u201314.","key":"e_1_3_3_1_22_2","DOI":"10.1109\/TGRS.2021.3136641"},{"doi-asserted-by":"crossref","unstructured":"Xu Tang Yijing Wang Jingjing Ma Xiangrong Zhang Fang Liu and Licheng Jiao. 2023. Interacting-enhancing feature transformer for cross-modal remote-sensing image and text retrieval. IEEE Transactions on Geoscience and Remote Sensing 61 (2023) 1\u201315.","key":"e_1_3_3_1_23_2","DOI":"10.1109\/TGRS.2023.3280546"},{"unstructured":"Ashish Vaswani Noam Shazeer Niki Parmar Jakob Uszkoreit Llion Jones Aidan\u00a0N Gomez \u0141ukasz Kaiser and Illia Polosukhin. 2017. Attention is all you need. Advances in neural information processing systems 30 (2017) 6000\u2013\u20136010.","key":"e_1_3_3_1_24_2"},{"doi-asserted-by":"crossref","unstructured":"Zhuoyue Wang Xueqian Wang Gang Li and Chengxi Li. 2024. Robust Cross-Modal Remote Sensing Image Retrieval via Maximal Correlation Augmentation. IEEE Transactions on Geoscience and Remote Sensing (2024) 1\u201317.","key":"e_1_3_3_1_25_2","DOI":"10.1109\/TGRS.2024.3406606"},{"doi-asserted-by":"crossref","unstructured":"Wei Xiong Yafei Lv Xiaohan Zhang and Yaqi Cui. 2020. Learning to translate for cross-source remote sensing image retrieval. IEEE Transactions on Geoscience and Remote Sensing 58 7 (2020) 4860\u20134874.","key":"e_1_3_3_1_26_2","DOI":"10.1109\/TGRS.2020.2968096"},{"doi-asserted-by":"crossref","unstructured":"Wei Xiong Zhenyu Xiong Yaqi Cui and Yafei Lv. 2020. A discriminative distillation network for cross-source remote sensing image retrieval. IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing 13 (2020) 1234\u20131247.","key":"e_1_3_3_1_27_2","DOI":"10.1109\/JSTARS.2020.2980870"},{"doi-asserted-by":"crossref","unstructured":"Wei Xiong Zhenyu Xiong Yang Zhang Yaqi Cui and Xiangqi Gu. 2020. A deep cross-modality hashing network for SAR and optical remote sensing images retrieval. IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing 13 (2020) 5284\u20135296.","key":"e_1_3_3_1_28_2","DOI":"10.1109\/JSTARS.2020.3021390"},{"doi-asserted-by":"crossref","unstructured":"Hongfeng Yu Chubo Deng Liangjin Zhao Lingxiang Hao Xiaoyu Liu Wanxuan Lu and Hongjian You. 2023. A light-weighted hypergraph neural network for multimodal remote sensing image retrieval. IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing 16 (2023) 2690\u20132702.","key":"e_1_3_3_1_29_2","DOI":"10.1109\/JSTARS.2023.3252670"},{"doi-asserted-by":"crossref","unstructured":"Hongfeng Yu Fanglong Yao Wanxuan Lu Nayu Liu Peiguang Li Hongjian You and Xian Sun. 2022. Text-image matching for cross-modal remote sensing image retrieval via graph neural network. IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing 16 (2022) 812\u2013824.","key":"e_1_3_3_1_30_2","DOI":"10.1109\/JSTARS.2022.3231851"},{"doi-asserted-by":"crossref","unstructured":"Zhiqiang Yuan Wenkai Zhang Kun Fu Xuan Li Chubo Deng Hongqi Wang and Xian Sun. 2021. Exploring a Fine-Grained Multiscale Method for Cross-Modal Remote Sensing Image Retrieval. IEEE Transactions on Geoscience and Remote Sensing 60 (2021) 1\u201319.","key":"e_1_3_3_1_31_2","DOI":"10.1109\/TGRS.2021.3078451"},{"doi-asserted-by":"crossref","unstructured":"Zhiqiang Yuan Wenkai Zhang Changyuan Tian Yongqiang Mao Ruixue Zhou Hongqi Wang Kun Fu and Xian Sun. 2022. MCRN: A multi-source cross-modal retrieval network for remote sensing. International Journal of Applied Earth Observation and Geoinformation 115 (2022) 103071.","key":"e_1_3_3_1_32_2","DOI":"10.1016\/j.jag.2022.103071"},{"doi-asserted-by":"crossref","unstructured":"Zhiqiang Yuan Wenkai Zhang Changyuan Tian Xuee Rong Zhengyuan Zhang Hongqi Wang Kun Fu and Xian Sun. 2022. Remote sensing cross-modal text-image retrieval based on global and local information. IEEE Transactions on Geoscience and Remote Sensing 60 (2022) 1\u201316.","key":"e_1_3_3_1_33_2","DOI":"10.1109\/TGRS.2022.3163706"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_34_2","DOI":"10.1609\/aaai.v28i1.8995"},{"doi-asserted-by":"crossref","unstructured":"Yichao Zhang Xiangtao Zheng and Xiaoqiang Lu. 2023. Remote sensing image retrieval by deep attention hashing with distance-adaptive ranking. IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing 16 (2023) 4301\u20134311.","key":"e_1_3_3_1_35_2","DOI":"10.1109\/JSTARS.2023.3271303"},{"doi-asserted-by":"crossref","unstructured":"Weixun Zhou Haiyan Guan Ziyu Li Zhenfeng Shao and Mahmoud\u00a0R Delavar. 2023. Remote sensing image retrieval in the past decade: Achievements challenges and future directions. IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing 16 (2023) 1447\u20131473.","key":"e_1_3_3_1_36_2","DOI":"10.1109\/JSTARS.2023.3236662"}],"event":{"acronym":"ICVGIP 2024","name":"ICVGIP 2024: Indian Conference on Computer Vision Graphics and Image Processing","location":"Bengaluru Karnataka India"},"container-title":["Proceedings of the Fifteenth Indian Conference on Computer Vision Graphics and Image Processing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3702250.3702270","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3702250.3702270","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:10:32Z","timestamp":1750295432000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3702250.3702270"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,13]]},"references-count":35,"alternative-id":["10.1145\/3702250.3702270","10.1145\/3702250"],"URL":"https:\/\/doi.org\/10.1145\/3702250.3702270","relation":{},"subject":[],"published":{"date-parts":[[2024,12,13]]},"assertion":[{"value":"2024-12-31","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}