{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,9]],"date-time":"2026-05-09T07:13:41Z","timestamp":1778310821213,"version":"3.51.4"},"reference-count":56,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100004480","name":"Shanxi Province Natural Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100004480","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100020758","name":"Science and Technology Innovation Team of Shanxi 
Province","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100020758","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Expert Systems with Applications"],"published-print":{"date-parts":[[2026,9]]},"DOI":"10.1016\/j.eswa.2026.132619","type":"journal-article","created":{"date-parts":[[2026,5,2]],"date-time":"2026-05-02T14:47:43Z","timestamp":1777733263000},"page":"132619","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["FDDF: Frequency decomposition and spatial-frequency dual-domain fusion network for multi-spectral pedestrian detection"],"prefix":"10.1016","volume":"326","author":[{"ORCID":"https:\/\/orcid.org\/0009-0006-1524-2581","authenticated-orcid":false,"given":"Xiaowei","family":"Liu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5769-0565","authenticated-orcid":false,"given":"Gang","family":"Xie","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xinlin","family":"Xie","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xinying","family":"Xu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"78","reference":[{"key":"10.1016\/j.eswa.2026.132619_bib0001","series-title":"2025 4th International symposium on computer applications and information technology (ISCAIT)","first-page":"453","article-title":"Frequency-domain-based multispectral pedestrian detection 
network","author":"An","year":"2025"},{"key":"10.1016\/j.eswa.2026.132619_bib0002","series-title":"Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition","first-page":"403","article-title":"Multimodal object detection by channel switching and spatial attention","author":"Cao","year":"2023"},{"key":"10.1016\/j.eswa.2026.132619_bib0003","series-title":"European conference on computer vision","first-page":"139","article-title":"Multimodal object detection via probabilistic ensembling","author":"Chen","year":"2022"},{"key":"10.1016\/j.eswa.2026.132619_bib0004","doi-asserted-by":"crossref","first-page":"8298","DOI":"10.1109\/TMM.2025.3604937","article-title":"AMFD: Distillation via adaptive multimodal fusion for multispectral pedestrian detection","volume":"27","author":"Chen","year":"2025","journal-title":"IEEE Transactions on Multimedia"},{"key":"10.1016\/j.eswa.2026.132619_bib0005","doi-asserted-by":"crossref","first-page":"40","DOI":"10.1016\/j.inffus.2020.11.001","article-title":"Recent advances and new guidelines on hyperspectral and multispectral image fusion","volume":"69","author":"Dian","year":"2021","journal-title":"Information Fusion"},{"key":"10.1016\/j.eswa.2026.132619_bib0006","article-title":"D2fusion: Dual-domain feature decoupling for infrared and visible image fusion","volume":"332","author":"Fan","year":"2025","journal-title":"Knowledge-Based Systems"},{"issue":"10","key":"10.1016\/j.eswa.2026.132619_bib0007","doi-asserted-by":"crossref","first-page":"13232","DOI":"10.1109\/TNNLS.2023.3266452","article-title":"LRAF-Net: Long-range attention fusion network for visible\u2013infrared object detection","volume":"35","author":"Fu","year":"2023","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"10.1016\/j.eswa.2026.132619_bib0008","series-title":"European conference on computer vision","first-page":"240","article-title":"Efficient frequency-domain image deraining with contrastive 
regularization","author":"Gao","year":"2024"},{"issue":"6","key":"10.1016\/j.eswa.2026.132619_bib0009","doi-asserted-by":"crossref","first-page":"820","DOI":"10.3390\/s16060820","article-title":"Pedestrian detection at day\/night time with visible and FIR cameras: A comparison","volume":"16","author":"Gonz\u00e1lez","year":"2016","journal-title":"Sensors"},{"key":"10.1016\/j.eswa.2026.132619_bib0010","doi-asserted-by":"crossref","first-page":"148","DOI":"10.1016\/j.inffus.2018.11.017","article-title":"Fusion of multispectral data through illumination-aware deep neural networks for pedestrian detection","volume":"50","author":"Guan","year":"2019","journal-title":"Information Fusion"},{"key":"10.1016\/j.eswa.2026.132619_bib0011","first-page":"3937","article-title":"Faster neural networks straight from jpeg","volume":"31","author":"Gueguen","year":"2018","journal-title":"Advances in Neural Information Processing Systems"},{"key":"10.1016\/j.eswa.2026.132619_bib0012","doi-asserted-by":"crossref","DOI":"10.1016\/j.patcog.2025.111383","article-title":"Multispectral transformer fusion via exploiting similarity and complementarity for robust pedestrian detection","volume":"162","author":"Hou","year":"2025","journal-title":"Pattern Recognition"},{"key":"10.1016\/j.eswa.2026.132619_bib0013","doi-asserted-by":"crossref","first-page":"4400","DOI":"10.1109\/TMM.2025.3543056","article-title":"Deformable cross-attention transformer for weakly aligned RGB\u2013T pedestrian detection","volume":"27","author":"Hu","year":"2025","journal-title":"IEEE Transactions on Multimedia"},{"key":"10.1016\/j.eswa.2026.132619_bib0014","series-title":"Proceedings of the IEEE conference on computer vision and pattern recognition","first-page":"1037","article-title":"Multispectral pedestrian detection: Benchmark dataset and baseline","author":"Hwang","year":"2015"},{"key":"10.1016\/j.eswa.2026.132619_bib0015","series-title":"Proceedings of the IEEE\/CVF international conference on computer 
vision","first-page":"3496","article-title":"LLVIP: A visible-infrared paired dataset for low-light vision","author":"Jia","year":"2021"},{"issue":"4","key":"10.1016\/j.eswa.2026.132619_bib0016","doi-asserted-by":"crossref","first-page":"7846","DOI":"10.1109\/LRA.2021.3099870","article-title":"MLPD: Multi-label pedestrian detector in multispectral domain","volume":"6","author":"Kim","year":"2021","journal-title":"IEEE Robotics and Automation Letters"},{"key":"10.1016\/j.eswa.2026.132619_bib0017","series-title":"Proceedings of the IEEE conference on computer vision and pattern recognition workshops","first-page":"49","article-title":"Fully convolutional region proposal networks for multispectral person detection","author":"Konig","year":"2017"},{"key":"10.1016\/j.eswa.2026.132619_bib0018","doi-asserted-by":"crossref","first-page":"144","DOI":"10.1016\/j.patrec.2024.02.012","article-title":"CrossFormer: Cross-guided attention for multi-modal object detection","volume":"179","author":"Lee","year":"2024","journal-title":"Pattern Recognition Letters"},{"key":"10.1016\/j.eswa.2026.132619_bib0019","unstructured":"Li, C., Song, D., Tong, R., & Tang, M. Multispectral pedestrian detection via simultaneous detection and segmentation. 
In British machine vision conference (BMVC)."},{"key":"10.1016\/j.eswa.2026.132619_bib0020","doi-asserted-by":"crossref","first-page":"161","DOI":"10.1016\/j.patcog.2018.08.005","article-title":"Illumination-aware faster r-CNN for robust multispectral pedestrian detection","volume":"85","author":"Li","year":"2019","journal-title":"Pattern Recognition"},{"key":"10.1016\/j.eswa.2026.132619_bib0021","series-title":"Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition","first-page":"6458","article-title":"Frequency-aware discriminative feature learning supervised by single-center loss for face forgery detection","author":"Li","year":"2021"},{"key":"10.1016\/j.eswa.2026.132619_bib0022","series-title":"Proceedings of the AAAI conference on artificial intelligence","first-page":"4797","article-title":"FD2-Net: Frequency-driven feature decomposition network for infrared-visible object detection","volume":"vol. 39","author":"Li","year":"2025"},{"key":"10.1016\/j.eswa.2026.132619_bib0023","doi-asserted-by":"crossref","first-page":"852","DOI":"10.1109\/TMM.2023.3272471","article-title":"Multiscale cross-modal homogeneity enhancement and confidence-aware fusion for multispectral pedestrian detection","volume":"26","author":"Li","year":"2023","journal-title":"IEEE Transactions on Multimedia"},{"issue":"5","key":"10.1016\/j.eswa.2026.132619_bib0024","doi-asserted-by":"crossref","first-page":"4716","DOI":"10.1109\/TITS.2023.3248483","article-title":"Emergent visual sensors for autonomous vehicles","volume":"24","author":"Li","year":"2023","journal-title":"IEEE Transactions on Intelligent Transportation Systems"},{"key":"10.1016\/j.eswa.2026.132619_bib0025","doi-asserted-by":"crossref","DOI":"10.1016\/j.knosys.2025.114365","article-title":"Frequency-driven deep learning network for image splicing forgery detection","volume":"330","author":"Liang","year":"2025","journal-title":"Knowledge-Based 
Systems"},{"key":"10.1016\/j.eswa.2026.132619_bib0026","series-title":"Proceedings of the IEEE conference on computer vision and pattern recognition","first-page":"2117","article-title":"Feature pyramid networks for object detection","author":"Lin","year":"2017"},{"key":"10.1016\/j.eswa.2026.132619_bib0027","unstructured":"Liu, J., Zhang, S., Wang, S., & Metaxas, D. N. (2016a). Multispectral deep neural networks for pedestrian detection. arXiv preprint arXiv: 1611.02644."},{"key":"10.1016\/j.eswa.2026.132619_bib0028","unstructured":"Liu, Q., Pi, J., Li, X., Yuan, D., He, Z., & Chang, X. Self-supervised transformer for infrared and visible image fusion. Available at SSRN 4279998."},{"key":"10.1016\/j.eswa.2026.132619_bib0029","series-title":"European conference on computer vision","first-page":"21","article-title":"SSD: Single shot multibox detector","author":"Liu","year":"2016"},{"issue":"6","key":"10.1016\/j.eswa.2026.132619_bib0030","doi-asserted-by":"crossref","first-page":"5441","DOI":"10.1109\/LRA.2024.3392083","article-title":"FDENet: Fusion depth semantics and edge-attention information for multispectral pedestrian detection","volume":"9","author":"Liu","year":"2024","journal-title":"IEEE Robotics and Automation Letters"},{"key":"10.1016\/j.eswa.2026.132619_bib0031","doi-asserted-by":"crossref","DOI":"10.1016\/j.knosys.2025.113195","article-title":"Camera-aware embedding refinement for unsupervised person re-identification","volume":"314","author":"Liu","year":"2025","journal-title":"Knowledge-Based Systems"},{"key":"10.1016\/j.eswa.2026.132619_bib0032","first-page":"1","article-title":"Frequency spectrum features modeling for real-time tiny object detection in remote sensing image","volume":"21","author":"Luo","year":"2024","journal-title":"IEEE Geoscience and Remote Sensing Letters"},{"key":"10.1016\/j.eswa.2026.132619_bib0033","doi-asserted-by":"crossref","first-page":"143","DOI":"10.1016\/j.patcog.2018.03.007","article-title":"Unified multi-spectral 
pedestrian detection based on probabilistic fusion networks","volume":"80","author":"Park","year":"2018","journal-title":"Pattern Recognition"},{"issue":"8","key":"10.1016\/j.eswa.2026.132619_bib0034","doi-asserted-by":"crossref","first-page":"2041","DOI":"10.3390\/rs15082041","article-title":"HAFNet: Hierarchical attentive fusion network for multispectral pedestrian detection","volume":"15","author":"Peng","year":"2023","journal-title":"Remote Sensing"},{"key":"10.1016\/j.eswa.2026.132619_bib0035","unstructured":"Qingyun, F., Dapeng, H., & Zhaokui, W. (2021). Cross-modality fusion transformer for multispectral object detection. arXiv preprint arXiv: 2111.00273."},{"key":"10.1016\/j.eswa.2026.132619_bib0036","unstructured":"Simonyan, K., & Zisserman, A. (2014). Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv: 1409.1556."},{"key":"10.1016\/j.eswa.2026.132619_bib0037","first-page":"1","article-title":"Joint classification of hyperspectral and liDAR data using height information guided hierarchical fusion-and-separation network","volume":"62","author":"Song","year":"2024","journal-title":"IEEE Transactions on Geoscience and Remote Sensing"},{"key":"10.1016\/j.eswa.2026.132619_bib0038","doi-asserted-by":"crossref","first-page":"6449","DOI":"10.1109\/TMM.2024.3350926","article-title":"Cross-modality proposal-guided feature mining for unregistered RGB-thermal pedestrian detection","volume":"26","author":"Tian","year":"2024","journal-title":"IEEE Transactions on Multimedia"},{"key":"10.1016\/j.eswa.2026.132619_bib0039","series-title":"Esann","first-page":"509","article-title":"Multispectral pedestrian detection using deep fusion convolutional neural networks","volume":"vol. 
587","author":"Wagner","year":"2016"},{"issue":"9","key":"10.1016\/j.eswa.2026.132619_bib0040","doi-asserted-by":"crossref","first-page":"2020","DOI":"10.3390\/rs14092020","article-title":"Improving RGB-infrared object detection by reducing cross-modality redundancy","volume":"14","author":"Wang","year":"2022","journal-title":"Remote Sensing"},{"key":"10.1016\/j.eswa.2026.132619_bib0041","series-title":"2025 IEEE 101st vehicular technology conference (VTC2025-spring)","first-page":"1","article-title":"WCANet: Wavelet-based cross-attention framework for multispectral pedestrian detection in intelligent transportation systems","author":"Wang","year":"2025"},{"issue":"4","key":"10.1016\/j.eswa.2026.132619_bib0042","doi-asserted-by":"crossref","first-page":"7584","DOI":"10.1109\/JSEN.2024.3523269","article-title":"OCTNet: Illumination-aware octave fusion and feature enhancement for multispectral pedestrian detection","volume":"25","author":"Wang","year":"2025","journal-title":"IEEE Sensors Journal"},{"key":"10.1016\/j.eswa.2026.132619_bib0043","unstructured":"Wang, X., Chai, L., Chen, J., & Shi, Z. (2023). WCCNet: Wavelet-integrated CNN with crossmodal rearranging fusion for fast multispectral pedestrian detection. 
arXiv preprint arXiv: 2308.01042."},{"key":"10.1016\/j.eswa.2026.132619_bib0044","series-title":"Proceedings of the 30th ACM international conference on multimedia","first-page":"4043","article-title":"Learning a dynamic cross-modal network for multispectral pedestrian detection","author":"Xie","year":"2022"},{"key":"10.1016\/j.eswa.2026.132619_bib0045","doi-asserted-by":"crossref","DOI":"10.1016\/j.inffus.2025.102939","article-title":"Efficient multispectral object detection with attentive feature aggregation leveraging zero-shot implicit illumination guidance","volume":"118","author":"Xiong","year":"2025","journal-title":"Information Fusion"},{"key":"10.1016\/j.eswa.2026.132619_bib0046","series-title":"Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition","first-page":"1740","article-title":"Learning in the frequency domain","author":"Xu","year":"2020"},{"key":"10.1016\/j.eswa.2026.132619_bib0047","series-title":"2022 International conference on robotics and automation (ICRA)","first-page":"2920","article-title":"BAANet: Learning bi-directional adaptive attention gates for multispectral pedestrian detection","author":"Yang","year":"2022"},{"key":"10.1016\/j.eswa.2026.132619_bib0048","article-title":"CMMDL: Cross-modal multi-domain learning method for image fusion","volume":"196","author":"Yuan","year":"2025","journal-title":"Neural Networks"},{"key":"10.1016\/j.eswa.2026.132619_bib0049","series-title":"2020 IEEE International conference on image processing (ICIP)","first-page":"276","article-title":"Multispectral fusion for object detection with cyclic fuse-and-refine blocks","author":"Zhang","year":"2020"},{"key":"10.1016\/j.eswa.2026.132619_bib0050","series-title":"Proceedings of the IEEE\/CVF winter conference on applications of computer vision","first-page":"72","article-title":"Guided attentive feature fusion for multispectral pedestrian 
detection","author":"Zhang","year":"2021"},{"key":"10.1016\/j.eswa.2026.132619_bib0051","doi-asserted-by":"crossref","first-page":"20","DOI":"10.1016\/j.inffus.2018.09.015","article-title":"Cross-modality interactive attention network for multispectral pedestrian detection","volume":"50","author":"Zhang","year":"2019","journal-title":"Information Fusion"},{"key":"10.1016\/j.eswa.2026.132619_bib0052","series-title":"Proceedings of the IEEE\/CVF international conference on computer vision","first-page":"5127","article-title":"Weakly aligned cross-modal learning for multispectral pedestrian detection","author":"Zhang","year":"2019"},{"key":"10.1016\/j.eswa.2026.132619_bib0053","doi-asserted-by":"crossref","first-page":"13276","DOI":"10.1109\/TNNLS.2024.3443455","article-title":"TFDet: Target-aware fusion for RGB-T pedestrian detection","volume":"36","author":"Zhang","year":"2024","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"10.1016\/j.eswa.2026.132619_bib0054","unstructured":"Zhao, T., Yuan, M., Jiang, F., Wang, N., & Wei, X. (2024). Removal and selection: Improving RGB-infrared object detection via coarse-to-fine fusion. 
arXiv preprint arXiv: 2401.10731."},{"key":"10.1016\/j.eswa.2026.132619_bib0055","series-title":"European conference on computer vision","first-page":"787","article-title":"Improving multispectral pedestrian detection by addressing modality imbalance problems","author":"Zhou","year":"2020"},{"key":"10.1016\/j.eswa.2026.132619_bib0056","series-title":"Proceedings of the IEEE\/CVF international conference on computer vision","first-page":"11219","article-title":"WaveMamba: Wavelet-driven mamba fusion for RGB-infrared object detection","author":"Zhu","year":"2025"}],"container-title":["Expert Systems with Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0957417426015320?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0957417426015320?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,5,9]],"date-time":"2026-05-09T06:52:53Z","timestamp":1778309573000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0957417426015320"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,9]]},"references-count":56,"alternative-id":["S0957417426015320"],"URL":"https:\/\/doi.org\/10.1016\/j.eswa.2026.132619","relation":{},"ISSN":["0957-4174"],"issn-type":[{"value":"0957-4174","type":"print"}],"subject":[],"published":{"date-parts":[[2026,9]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"FDDF: Frequency decomposition and spatial-frequency dual-domain fusion network for multi-spectral pedestrian detection","name":"articletitle","label":"Article Title"},{"value":"Expert Systems with Applications","name":"journaltitle","label":"Journal 
Title"},{"value":"https:\/\/doi.org\/10.1016\/j.eswa.2026.132619","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier Ltd. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"132619"}}