{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T15:54:41Z","timestamp":1781538881380,"version":"3.54.5"},"publisher-location":"New York, NY, USA","reference-count":73,"publisher":"ACM","license":[{"start":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T00:00:00Z","timestamp":1781481600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,6,16]]},"DOI":"10.1145\/3805622.3810593","type":"proceedings-article","created":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T14:42:57Z","timestamp":1781534577000},"page":"1260-1269","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Learning Where to Embed: Noise-Aware Positional Embedding for Query Retrieval in Small-Object Detection"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0009-1956-4029","authenticated-orcid":false,"given":"Yangchen","family":"Zeng","sequence":"first","affiliation":[{"name":"Southeast University, Nanjing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9985-0165","authenticated-orcid":false,"given":"Zhenyu","family":"Yu","sequence":"additional","affiliation":[{"name":"Fudan University, Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-2691-5046","authenticated-orcid":false,"given":"Dongming","family":"Jiang","sequence":"additional","affiliation":[{"name":"The University of Texas at Dallas, Dallas, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-6269-707X","authenticated-orcid":false,"given":"Wenbo","family":"Zhang","sequence":"additional","affiliation":[{"name":"Zhejiang Normal university, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4702-0987","authenticated-orcid":false,"given":"Yifan","family":"Hong","sequence":"additional","affiliation":[{"name":"Data Space Research Institute, Hefei Comprehensive National Science Center, Hefei, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-6913-0224","authenticated-orcid":false,"given":"Zhanhua","family":"Hu","sequence":"additional","affiliation":[{"name":"Rice university, Houston, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-5786-7468","authenticated-orcid":false,"given":"Jiao","family":"Luo","sequence":"additional","affiliation":[{"name":"College of Informatics, Huazhong Agricultural University, Wuhan, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1856-5064","authenticated-orcid":false,"given":"Kangning","family":"Cui","sequence":"additional","affiliation":[{"name":"Wake Forest University, Winston-Salem, USA and City University of Hong Kong (Dongguan), Dongguan, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2026,6,15]]},"reference":[{"key":"e_1_3_3_1_2_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP46576.2022.9897990"},{"key":"e_1_3_3_1_3_2","unstructured":"Aduen Benjumea Izzeddin Teeti Fabio Cuzzolin and Andrew Bradley. 2021. YOLO-Z: Improving small object detection in YOLOv5 for autonomous vehicles. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2112.11798 (2021)."},{"key":"e_1_3_3_1_4_2","unstructured":"Alexey Bochkovskiy Chien-Yao Wang and Hong-Yuan\u00a0Mark Liao. 2020. Yolov4: Optimal speed and accuracy of object detection. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2004.10934 (2020)."},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00644"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"crossref","unstructured":"Si-Yuan Cao Beinan Yu Lun Luo Runmin Zhang Shu-Jie Chen Chunguang Li and Hui-Liang Shen. 2023. PCNet: A structure similarity enhancement method for multispectral and multimodal image registration. Inf. Fusion 94 (2023) 200\u2013214.","DOI":"10.1016\/j.inffus.2023.02.004"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"e_1_3_3_1_8_2","unstructured":"Chu Chen Aitor Artola Yang Liu Se\u00a0Weon Park Raymond\u00a0H Chan Jean-Michel Morel and Kannie\u00a0WY Chan. 2025. Blind Adaptive Local Denoising for CEST Imaging. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2511.20081 (2025)."},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISBI56570.2024.10635440"},{"key":"e_1_3_3_1_10_2","unstructured":"Gong Cheng Xiang Yuan Xiwen Yao Kebing Yan Qinghua Zeng Xingxing Xie and Junwei Han. 2023. Towards large-scale small object detection: Survey and benchmarks. IEEE TPAMI 45 11 (2023) 13467\u201313488."},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"crossref","unstructured":"Gong Cheng Peicheng Zhou and Junwei Han. 2016. Learning rotation-invariant convolutional neural networks for object detection in VHR optical remote sensing images. IEEE TGRS 54 12 (2016) 7405\u20137415.","DOI":"10.1109\/TGRS.2016.2601622"},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"crossref","unstructured":"Kangning Cui Ruoning Li Sam\u00a0L Polk Yinyi Lin Hongsheng Zhang James\u00a0M Murphy Robert\u00a0J Plemmons and Raymond\u00a0H Chan. 2024. Superpixel-based and spatially regularized diffusion learning for unsupervised hyperspectral image clustering. IEEE Transactions on Geoscience and Remote Sensing 62 (2024) 1\u201318.","DOI":"10.1109\/TGRS.2024.3385202"},{"key":"e_1_3_3_1_13_2","doi-asserted-by":"publisher","DOI":"10.1145\/3603287.3651220"},{"key":"e_1_3_3_1_14_2","unstructured":"Kangning Cui Wei Tang Rongkun Zhu Manqi Wang Gregory\u00a0D Larsen Victor\u00a0P Pauca Sarra Alqahtani Fan Yang David Segurado Paul Fine et\u00a0al. 2025. Efficient Localization and Spatial Distribution Modeling of Canopy Palms Using UAV Imagery. IEEE TGRS (2025)."},{"key":"e_1_3_3_1_15_2","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2025\/1067"},{"key":"e_1_3_3_1_16_2","doi-asserted-by":"crossref","unstructured":"Xingyu Di Kangning Cui and Rui-Feng Wang. 2025. Toward Efficient UAV-Based Small Object Detection: A Lightweight Network with Enhanced Feature Fusion. Remote Sens. 17 13 (2025) 2235.","DOI":"10.3390\/rs17132235"},{"key":"e_1_3_3_1_17_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00667"},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"crossref","unstructured":"Mark Everingham Luc Van\u00a0Gool Christopher\u00a0KI Williams John Winn and Andrew Zisserman. 2010. The pascal visual object classes (voc) challenge. IJCV (2010).","DOI":"10.1007\/s11263-009-0275-4"},{"key":"e_1_3_3_1_19_2","first-page":"1","volume-title":"CVPR","author":"Farhadi Ali","year":"2018","unstructured":"Ali Farhadi, Joseph Redmon, et\u00a0al. 2018. Yolov3: An incremental improvement. In CVPR , Vol.\u00a01804. Springer Berlin\/Heidelberg, Germany, 1\u20136."},{"key":"e_1_3_3_1_20_2","doi-asserted-by":"crossref","unstructured":"Yuhang Han Bingchen Duan Renxiang Guan Guang Yang and Zhen Zhen. 2024. LUFFD-YOLO: A lightweight model for UAV remote sensing forest fire detection based on attention mechanism and multi-level feature fusion. Remote Sens. 16 12 (2024) 2177.","DOI":"10.3390\/rs16122177"},{"key":"e_1_3_3_1_21_2","doi-asserted-by":"crossref","unstructured":"Yu-Shan Han Sheng-Lun Zhao Chu Chen Kangning Cui Pingfan Hu and Rui-Feng Wang. 2026. SEAF-Net: A Sustainable and Lightweight Attention-Enhanced Detection Network for Underwater Fish Species Recognition. Journal of Marine Science and Engineering 14 4 (2026) 351.","DOI":"10.3390\/jmse14040351"},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"e_1_3_3_1_23_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_3_1_24_2","unstructured":"Maolin He Rena Gao Mike Conway and Brian\u00a0E Chapman. 2024. Query pipeline optimization for cancer patient question answering systems. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2412.14751 (2024)."},{"key":"e_1_3_3_1_25_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.685"},{"key":"e_1_3_3_1_26_2","doi-asserted-by":"crossref","unstructured":"Yuchao Hou Ting Xu Hongping Hu Peng Wang Hongxin Xue and Yanping Bai. 2020. MdpCaps-CSL for SAR image target recognition with limited labeled training data. IEEE Access 8 (2020) 176217\u2013176231.","DOI":"10.1109\/ACCESS.2020.3026469"},{"key":"e_1_3_3_1_27_2","unstructured":"Yuchao Hou Shuai Zhao Xiaoyu Xia Minghui Liwang Zijian Li Nan Xu Di Wu Youliang Tian and Tony\u00a0QS Quek. 2025. FedC-DAC: A Federated Clustering with Dynamic Aggregation and Calibration Method for SAR Image Target Recognition. IEEE JSTAR (2025)."},{"key":"e_1_3_3_1_28_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00140"},{"key":"e_1_3_3_1_29_2","unstructured":"Dongming Jiang Yi Li Guanpeng Li and Bingzhe Li. 2026. MAGMA: A Multi-Graph based Agentic Memory Architecture for AI Agents. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2601.03236 (2026)."},{"key":"e_1_3_3_1_30_2","unstructured":"Dongming Jiang Yi Li Songtao Wei Jinxin Yang Ayushi Kishore Alysa Zhao Dingyi Kang Xu Hu Feng Chen Qiannan Li et\u00a0al. 2026. Anatomy of Agentic Memory: Taxonomy and Empirical Analysis of Evaluation and System Limitations. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2602.19320 (2026)."},{"key":"e_1_3_3_1_31_2","volume-title":"Forty-second International Conference on Machine Learning","author":"Jiang Ting","year":"2025","unstructured":"Ting Jiang, Yixiao Wang, Hancheng Ye, Zishan Shao, Jingwei Sun, Jingyang Zhang, Zekai Chen, Jianyi Zhang, Yiran Chen, and Hai Li. 2025. SADA: Stability-guided Adaptive Diffusion Acceleration. In Forty-second International Conference on Machine Learning."},{"key":"e_1_3_3_1_32_2","unstructured":"Rahima Khanam and Muhammad Hussain. 2024. Yolov11: An overview of the key architectural enhancements. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2410.17725 (2024)."},{"key":"e_1_3_3_1_33_2","unstructured":"Chuyi Li Lulu Li Hongliang Jiang Kaiheng Weng Yifei Geng Liang Li Zaidan Ke Qingyuan Li Meng Cheng Weiqiang Nie et\u00a0al. 2022. YOLOv6: A single-stage object detection framework for industrial applications. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2209.02976 (2022)."},{"key":"e_1_3_3_1_34_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01325"},{"key":"e_1_3_3_1_35_2","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3681043"},{"key":"e_1_3_3_1_36_2","doi-asserted-by":"crossref","unstructured":"Yihong Li Ting Wang Zhe Cao Haonan Xin and Rong Wang. 2025. Efficient unsupervised clustering of hyperspectral images via flexible multi-anchor graphs. Remote Sens. 17 15 (2025) 2647.","DOI":"10.3390\/rs17152647"},{"key":"e_1_3_3_1_37_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"e_1_3_3_1_38_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"e_1_3_3_1_39_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"e_1_3_3_1_40_2","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3681383"},{"key":"e_1_3_3_1_41_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00363"},{"key":"e_1_3_3_1_42_2","doi-asserted-by":"crossref","unstructured":"Fei Pan Yutong Wu Kangning Cui Shuxun Chen Yanfang Li Yaofang Liu Adnan Shakoor Han Zhao Beijia Lu Shaohua Zhi et\u00a0al. 2024. Accurate detection and instance segmentation of unstained living adherent cells in differential interference contrast images. Computers in Biology and Medicine 182 (2024) 109151.","DOI":"10.1016\/j.compbiomed.2024.109151"},{"key":"e_1_3_3_1_43_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00558"},{"key":"e_1_3_3_1_44_2","volume-title":"NeurIPS","author":"Rao Yongming","year":"2021","unstructured":"Yongming Rao, Wenliang Zhao, Benlin Liu, Jiwen Lu, Jie Zhou, and Cho-Jui Hsieh. 2021. DynamicViT: Efficient Vision Transformers with Dynamic Token Sparsification. In NeurIPS."},{"key":"e_1_3_3_1_45_2","volume-title":"NeurIPS","author":"Ren Shaoqing","year":"2015","unstructured":"Shaoqing Ren, Kaiming He, Ross Girshick, and Jian Sun. 2015. Faster R-CNN: Towards real-time object detection with region proposal networks. In NeurIPS."},{"key":"e_1_3_3_1_46_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v40i30.39720"},{"key":"e_1_3_3_1_47_2","doi-asserted-by":"crossref","unstructured":"Huihui Sun and Rui-Feng Wang. 2025. BMDNet-YOLO: A Lightweight and Robust Model for High-Precision Real-Time Recognition of Blueberry Maturity. Horticulturae 11 10 (2025) 1202.","DOI":"10.3390\/horticulturae11101202"},{"key":"e_1_3_3_1_48_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISBI56570.2024.10635760"},{"key":"e_1_3_3_1_49_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00972"},{"key":"e_1_3_3_1_50_2","unstructured":"Shuqin Tu Yunjie Tang Chengjie Li Yun Liang Yangchen Zeng and Xiaolong Liu. 2022. Behavior recognition and tracking of group-housed pigs based on improved ByteTrack algorithm. Trans. Chin. Soc. Agric. Mach. 53 12 (2022) 264\u2013272."},{"key":"e_1_3_3_1_51_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"e_1_3_3_1_52_2","doi-asserted-by":"crossref","unstructured":"Jinze Wang Yongli Ren Jie Li and Ke Deng. 2021. The footprint of factorization models and their applications in collaborative filtering. ACM Transactions on Information Systems (TOIS) 40 4 (2021) 1\u201332.","DOI":"10.1145\/3490475"},{"key":"e_1_3_3_1_53_2","unstructured":"Rui-Feng Wang Daniel Petti Yue Chen and Changying Li. 2026. DINOv3 Visual Representations for Blueberry Perception Toward Robotic Harvesting. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2603.02419 (2026)."},{"key":"e_1_3_3_1_54_2","first-page":"500","volume-title":"Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision","author":"Wang Rui-Feng","year":"2026","unstructured":"Rui-Feng Wang, Mingrui Xu, Matthew Bauer, Iago Schardong, Xiaowen Ma, Peng Chee, and Kangning Cui. 2026. Cott-ADNet: Lightweight Real-Time Cotton Boll and Flower Detection Under Field Conditions. In Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision. 500\u2013509."},{"key":"e_1_3_3_1_55_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00061"},{"key":"e_1_3_3_1_56_2","doi-asserted-by":"crossref","unstructured":"Wei Wei Yu Cheng Jiafeng He and Xiyue Zhu. 2024. A review of small object detection based on deep learning. Neural Comput. Appl. 36 12 (2024) 6283\u20136303.","DOI":"10.1007\/s00521-024-09422-6"},{"key":"e_1_3_3_1_57_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00009"},{"key":"e_1_3_3_1_58_2","volume-title":"AAAI","author":"Xiong Yunyang","year":"2021","unstructured":"Yunyang Xiong, Zhanpeng Zeng, Rudrasis Chakraborty, Mingxing Tan, Glenn Fung, Yin Li, and Vikas Singh. 2021. Nystr\u00f6mformer: A nystr\u00f6m-based algorithm for approximating self-attention. In AAAI."},{"key":"e_1_3_3_1_59_2","doi-asserted-by":"crossref","unstructured":"Xue Yang Junchi Yan Wenlong Liao Xiaokang Yang Jin Tang and Tao He. 2022. Scrdet++: Detecting small cluttered and rotated objects via instance-level feature denoising and rotation loss smoothing. IEEE TPAMI (2022).","DOI":"10.1109\/TPAMI.2022.3166956"},{"key":"e_1_3_3_1_60_2","volume-title":"NeurIPS 2025","author":"Yu Zhenyu","year":"2025","unstructured":"Zhenyu Yu, Mohd Yamani\u00a0Idna Idris, and Pei Wang. 2025. Visualizing Our Changing Earth: A Creative AI Framework for Democratizing Environmental Storytelling Through Satellite Imagery. In NeurIPS 2025."},{"key":"e_1_3_3_1_61_2","doi-asserted-by":"crossref","unstructured":"Zhenyu Yu Mohd Yamani\u00a0Idna Idris Pei Wang and Rizwan Qureshi. 2026. DINOv3-Powered Multi-Task Foundation Model for Quantitative Remote Sensing Estimation. AAAI 2026 40 48 (2026) 41455\u201341456.","DOI":"10.1609\/aaai.v40i48.42304"},{"key":"e_1_3_3_1_62_2","doi-asserted-by":"crossref","unstructured":"Zhenyu Yu Haoran Jiang Pei Wang Zizhen Lin and Yong Xiang. 2026. Spatiotemporal Alignment for Remote Sensing Image Recovery via Terrain-Aware Diffusion. ICASSP 2026 (2026).","DOI":"10.1109\/ICASSP55912.2026.11460753"},{"key":"e_1_3_3_1_63_2","doi-asserted-by":"crossref","unstructured":"Zhenyu Yu Chunlei Meng Yangchen Zeng Mohd Yamani\u00a0Idna Idris and Shuigeng Zhou. 2026. ADS-POI: Agentic Spatiotemporal State Decomposition for Next Point-of-Interest Recommendation. ACM ISBN (2026) 978\u20131.","DOI":"10.2139\/ssrn.6532638"},{"key":"e_1_3_3_1_64_2","doi-asserted-by":"crossref","unstructured":"Zhenyu Yu Chunlei Meng Yangchen Zeng Mohd Yamani\u00a0Idna Idris and Shuigeng Zhou. 2026. CaST-POI: Candidate-Conditioned Spatiotemporal Modeling for Next POI Recommendation. ACM ISBN (2026) 978\u20131.","DOI":"10.2139\/ssrn.6259379"},{"key":"e_1_3_3_1_65_2","doi-asserted-by":"crossref","unstructured":"Zhenyu Yu Jinnian Wang and Mohd Yamani\u00a0Idna Idris. 2025. IIDM: Improved implicit diffusion model with knowledge distillation to estimate the spatial distribution density of carbon stock in remote sensing imagery. KBS (2025) 115131.","DOI":"10.1016\/j.knosys.2025.115131"},{"key":"e_1_3_3_1_66_2","unstructured":"YangChen Zeng. 2025. Hmpe: Heatmap embedding for efficient transformer-based small object detection. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2504.13469 (2025)."},{"key":"e_1_3_3_1_67_2","unstructured":"Yangchen Zeng. 2026. DeepInterestGR: Mining Deep Multi-Interest Using Multi-Modal LLMs for Generative Recommendation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2602.18907 (2026)."},{"key":"e_1_3_3_1_68_2","volume-title":"ICLR","author":"Zhang Hao","year":"2023","unstructured":"Hao Zhang, Feng Li, Shilong Liu, Lei Zhang, Hang Su, Jun Zhu, Lionel Ni, and Harry Shum. 2023. Dino: Detr with improved denoising anchor boxes for end-to-end object detection. In ICLR."},{"key":"e_1_3_3_1_69_2","doi-asserted-by":"crossref","unstructured":"Jiaqing Zhang Jie Lei Weiying Xie Zhenman Fang Yunsong Li and Qian Du. 2023. SuperYOLO: Super resolution assisted object detection in multimodal remote sensing imagery. IEEE TGRS 61 (2023) 1\u201315.","DOI":"10.1109\/TGRS.2023.3258666"},{"key":"e_1_3_3_1_70_2","doi-asserted-by":"publisher","unstructured":"Wei Zhang Qin Huang Mengting Ma Yizhen Jiang Yun Chen Zhenhua Huang Wangyu Wu Kangning Cui Rongrong Lian Zhenkai Wu and Xiaowen Ma. 2026. Center-guided Classifier for Semantic Segmentation of Remote Sensing Images. IEEE TGRS (2026). 10.1109\/TGRS.2026.3657453","DOI":"10.1109\/TGRS.2026.3657453"},{"key":"e_1_3_3_1_71_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01605"},{"key":"e_1_3_3_1_72_2","unstructured":"Rongkun Zhu Kangning Cui Wei Tang Rui-Feng Wang Sarra Alqahtani David Lutz Fan Yang Paul Fine Jordan Karubian Robert Plemmons et\u00a0al. 2025. From Orthomosaics to Raw UAV Imagery: Enhancing Palm Detection and Crown-Center Localization. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2509.12400 (2025)."},{"key":"e_1_3_3_1_73_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00953"},{"key":"e_1_3_3_1_74_2","unstructured":"Xizhou Zhu Weijie Su Lewei Lu Bin Li Xiaogang Wang and Jifeng Dai. 2020. Deformable DETR: Deformable transformers for end-to-end object detection. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2010.04159 (2020)."}],"event":{"name":"ICMR '26: International Conference on Multimedia Retrieval","location":"Amsterdam The Netherlands","acronym":"ICMR '26","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 2026 International Conference on Multimedia Retrieval"],"original-title":[],"deposited":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T15:02:41Z","timestamp":1781535761000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3805622.3810593"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6,15]]},"references-count":73,"alternative-id":["10.1145\/3805622.3810593","10.1145\/3805622"],"URL":"https:\/\/doi.org\/10.1145\/3805622.3810593","relation":{},"subject":[],"published":{"date-parts":[[2026,6,15]]},"assertion":[{"value":"2026-06-15","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}