{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,11]],"date-time":"2026-02-11T21:30:53Z","timestamp":1770845453981,"version":"3.50.1"},"reference-count":28,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,5]],"date-time":"2025-10-05T00:00:00Z","timestamp":1759622400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,5]],"date-time":"2025-10-05T00:00:00Z","timestamp":1759622400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,5]]},"DOI":"10.1109\/smc58881.2025.11343398","type":"proceedings-article","created":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T20:54:44Z","timestamp":1769633684000},"page":"716-721","source":"Crossref","is-referenced-by-count":0,"title":["Difference-Guided Modality Fusion Network for Multimodal Object Detection"],"prefix":"10.1109","author":[{"given":"Linxuan","family":"Li","sequence":"first","affiliation":[{"name":"Xi&#x2019;an Jiaotong University,National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, National Engineering Research Center for Visual Information and Applications, and Institute of Artificial Intelligence and Robotics,Xi&#x2019;an,China,710049"}]},{"given":"Meiqin","family":"Liu","sequence":"additional","affiliation":[{"name":"Xi&#x2019;an Jiaotong University,National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, National Engineering Research Center for Visual Information and Applications, and Institute of Artificial Intelligence and Robotics,Xi&#x2019;an,China,710049"}]},{"given":"Jian","family":"Lan","sequence":"additional","affiliation":[{"name":"Xi&#x2019;an Jiaotong University,School of Electronics and Information Engineering,Xi&#x2019;an,China,710049"}]},{"given":"Shanling","family":"Dong","sequence":"additional","affiliation":[{"name":"Zhejiang University,College of Electrical Engineering,Hangzhou,China,310027"}]},{"given":"Zhunga","family":"Liu","sequence":"additional","affiliation":[{"name":"Northwestern Polytechnical University,School of Automation,Xi&#x2019;an,China,710072"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.3390\/automation5040029"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2024.102492"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2023.3258666"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW63382.2024.00305"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/JSEN.2024.3386709"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW63382.2024.00563"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2024.02.012"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109913"},{"key":"ref9","article-title":"Attention is all you need","author":"Vaswani","year":"2017","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01104"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TIV.2024.3443264"},{"key":"ref12","article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","volume-title":"International Conference on Learning Representations","author":"Dosovitskiy"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00326"},{"key":"ref14","article-title":"Omni-dimensional dynamic convolution","author":"Li","year":"2022"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/S0016-0032(96)00063-4"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP40778.2020.9191080"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW54120.2021.00389"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00571"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"ref20","article-title":"Cross-modality fusion transformer for multispectral object detection","author":"Qingyun","year":"2021"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20077-9_9"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2022.3168279"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW59228.2023.00046"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TIV.2024.3393015"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01906"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/JAS.2022.106082"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00572"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3612135"}],"event":{"name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","location":"Vienna, Austria","start":{"date-parts":[[2025,10,5]]},"end":{"date-parts":[[2025,10,8]]}},"container-title":["2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11342430\/11342431\/11343398.pdf?arnumber=11343398","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,11]],"date-time":"2026-02-11T20:50:48Z","timestamp":1770843048000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11343398\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,5]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/smc58881.2025.11343398","relation":{},"subject":[],"published":{"date-parts":[[2025,10,5]]}}}