{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T11:05:01Z","timestamp":1773486301990,"version":"3.50.1"},"reference-count":62,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2026,2,9]],"date-time":"2026-02-09T00:00:00Z","timestamp":1770595200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,2,9]],"date-time":"2026-02-09T00:00:00Z","timestamp":1770595200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Yunnan Fundamental Research Projects","award":["202301AW070007, 202201AT070112, 202301AU070210, 202401AT070470"],"award-info":[{"award-number":["202301AW070007, 202201AT070112, 202301AU070210, 202401AT070470"]}]},{"name":"Yunnan Province Expert Workstations","award":["202305AF150078"],"award-info":[{"award-number":["202305AF150078"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62261060"],"award-info":[{"award-number":["62261060"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100018531","name":"Major Science and Technology Projects in Yunnan Province","doi-asserted-by":"publisher","award":["202202AD080002"],"award-info":[{"award-number":["202202AD080002"]}],"id":[{"id":"10.13039\/501100018531","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Xingdian Talent Project in Yunnan Province"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Pattern Anal Applic"],"published-print":{"date-parts":[[2026,3]]},"DOI":"10.1007\/s10044-026-01622-1","type":"journal-article","created":{"date-parts":[[2026,2,9]],"date-time":"2026-02-09T17:49:50Z","timestamp":1770659390000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["TDFG-GAN: Top-down-feature guided GAN for thermal infrared image colorization"],"prefix":"10.1007","volume":"29","author":[{"given":"Yang","family":"Gao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qian","family":"Jiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kai","family":"Yang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hongyue","family":"Huang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xuyang","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wei","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xin","family":"Jin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,2,9]]},"reference":[{"issue":"3","key":"1622_CR1","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1016\/S1350-4495(02)00140-8","volume":"43","author":"A Rogalski","year":"2002","unstructured":"Rogalski A (2002) Infrared detectors: an overview. Infrared Phys Technol 43(3):187\u2013210. https:\/\/doi.org\/10.1016\/S1350-4495(02)00140-8","journal-title":"Infrared Phys Technol"},{"key":"1622_CR2","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1016\/j.infrared.2013.03.006","volume":"60","author":"S Bagavathiappan","year":"2013","unstructured":"Bagavathiappan S, Lahiri BB, Saravanan T, Philip J, Jayakumar T (2013) Infrared thermography for condition monitoring\u2014a review. Infrared Phys Technol 60:35\u201355. https:\/\/doi.org\/10.1016\/j.infrared.2013.03.006","journal-title":"Infrared Phys Technol"},{"issue":"3","key":"1622_CR3","doi-asserted-by":"publisher","first-page":"136","DOI":"10.1016\/j.infrared.2010.12.003","volume":"54","author":"A Rogalski","year":"2011","unstructured":"Rogalski A (2011) Recent progress in infrared detector technologies. Infrared Phys Technol 54(3):136\u2013154. https:\/\/doi.org\/10.1016\/j.infrared.2010.12.003. (Proceedings of the International Conference on Quantum Structure Infrared Photodetector (QSIP) 2010)","journal-title":"Infrared Phys Technol"},{"issue":"4","key":"1622_CR4","doi-asserted-by":"publisher","first-page":"675","DOI":"10.1109\/TCE.2014.7027342","volume":"60","author":"F Erden","year":"2014","unstructured":"Erden F, \u00c7etin AE (2014) Hand gesture based remote control system using infrared sensors and a camera. IEEE Trans Consum Electron 60(4):675\u2013680. https:\/\/doi.org\/10.1109\/TCE.2014.7027342","journal-title":"IEEE Trans Consum Electron"},{"key":"1622_CR5","doi-asserted-by":"publisher","unstructured":"Bhat N, Saggu N, Kumar S (2020) Generating visible spectrum images from thermal infrared using conditional generative adversarial networks. In: 2020 5th International Conference on Communication and Electronics Systems (ICCES), pp 1390\u20131394. https:\/\/doi.org\/10.1109\/ICCES48766.2020.9137895","DOI":"10.1109\/ICCES48766.2020.9137895"},{"key":"1622_CR6","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2025.131865","volume":"660","author":"W Ma","year":"2026","unstructured":"Ma W, Jiang Q, Wang Q, Yu D, Huang Y, He B, Jin X (2026) Ycsc-unet: A y-shaped composite spatial channel network based on u-net for breast lesion ultrasound image segmentation. Neurocomputing 660:131865. https:\/\/doi.org\/10.1016\/j.neucom.2025.131865","journal-title":"Neurocomputing"},{"key":"1622_CR7","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2025.113105","volume":"163","author":"Q Jiang","year":"2026","unstructured":"Jiang Q, Yu H, Jin X, Wang P, Lee S-J, Yao S, Jiang H, Lan W, Zhou W (2026) Attention-guided network for infrared unmanned aerial vehicle target detection. Eng Appl Artif Intell 163:113105. https:\/\/doi.org\/10.1016\/j.engappai.2025.113105","journal-title":"Eng Appl Artif Intell"},{"key":"1622_CR8","doi-asserted-by":"publisher","DOI":"10.1016\/j.infrared.2025.105779","volume":"147","author":"S Guo","year":"2025","unstructured":"Guo S, Yi S, Chen M, Zhang Y (2025) Pifrnet: A progressive infrared feature-refinement network for single infrared image super-resolution. Infrared Phys Technol 147:105779. https:\/\/doi.org\/10.1016\/j.infrared.2025.105779","journal-title":"Infrared Phys Technol"},{"key":"1622_CR9","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2025.103894","volume":"127","author":"Q Jiang","year":"2026","unstructured":"Jiang Q, Zhou T, Yu D, Song Y, Yao S, Wang P, Jin X (2026) Gsu-fusion: a text-guided symmetric u-net framework for infrared and visible image fusion. Inf Fusion 127:103894. https:\/\/doi.org\/10.1016\/j.inffus.2025.103894","journal-title":"Inf Fusion"},{"issue":"3","key":"1622_CR10","doi-asserted-by":"publisher","first-page":"480","DOI":"10.1109\/TIV.2020.3039456","volume":"6","author":"M Schutera","year":"2021","unstructured":"Schutera M, Hussein M, Abhau J, Mikut R, Reischl M (2021) Night-to-day: online image-to-image translation for object detection within autonomous driving by night. IEEE Trans Intell Veh 6(3):480\u2013489. https:\/\/doi.org\/10.1109\/TIV.2020.3039456","journal-title":"IEEE Trans Intell Veh"},{"issue":"3","key":"1622_CR11","doi-asserted-by":"publisher","first-page":"2285","DOI":"10.1109\/TIV.2022.3221767","volume":"8","author":"R Song","year":"2023","unstructured":"Song R, Ai Y, Tian B, Chen L, Zhu F, Yao F (2023) Msfanet: a light weight object detector based on context aggregation and attention mechanism for autonomous mining truck. IEEE Trans Intell Veh 8(3):2285\u20132295. https:\/\/doi.org\/10.1109\/TIV.2022.3221767","journal-title":"IEEE Trans Intell Veh"},{"key":"1622_CR12","doi-asserted-by":"publisher","first-page":"20","DOI":"10.20517\/ir.2024.02","volume":"4","author":"H Han","year":"2024","unstructured":"Han H, Xue X, Li Q, Gao H, Wang R, Jiang R, Ren Z, Meng R, Li M, Guo Y et al (2024) Pig-ear detection from the thermal infrared image based on improved yolov8n. Intell Robot 4:20\u201338","journal-title":"Intell Robot"},{"key":"1622_CR13","doi-asserted-by":"publisher","DOI":"10.1016\/j.infrared.2021.103754","volume":"116","author":"Y He","year":"2021","unstructured":"He Y, Deng B, Wang H, Cheng L, Zhou K, Cai S, Ciampa F (2021) Infrared machine vision and infrared thermography with deep learning: a review. Infrared Phys Technol 116:103754. https:\/\/doi.org\/10.1016\/j.infrared.2021.103754","journal-title":"Infrared Phys Technol"},{"key":"1622_CR14","doi-asserted-by":"publisher","first-page":"245","DOI":"10.1007\/s00138-013-0570-5","volume":"25","author":"R Gade","year":"2014","unstructured":"Gade R, Moeslund TB (2014) Thermal cameras and applications: a survey. Mach Vis Appl 25:245\u2013262","journal-title":"Mach Vis Appl"},{"key":"1622_CR15","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2022.105006","volume":"114","author":"S Huang","year":"2022","unstructured":"Huang S, Jin X, Jiang Q, Liu L (2022) Deep learning for image colorization: current and future prospects. Eng Appl Artif Intell 114:105006. https:\/\/doi.org\/10.1016\/j.engappai.2022.105006","journal-title":"Eng Appl Artif Intell"},{"key":"1622_CR16","doi-asserted-by":"publisher","first-page":"478","DOI":"10.1016\/j.infrared.2017.07.010","volume":"85","author":"X Jin","year":"2017","unstructured":"Jin X, Jiang Q, Yao S, Zhou D, Nie R, Hai J, He K (2017) A survey of infrared and visual image fusion methods. Infrared Phys Technol 85:478\u2013501. https:\/\/doi.org\/10.1016\/j.infrared.2017.07.010","journal-title":"Infrared Phys Technol"},{"key":"1622_CR17","doi-asserted-by":"publisher","first-page":"426","DOI":"10.1016\/j.istruc.2021.12.055","volume":"37","author":"Y Tang","year":"2022","unstructured":"Tang Y, Zhu M, Chen Z, Wu C, Chen B, Li C, Li L (2022) Seismic performance evaluation of recycled aggregate concrete-filled steel tubular columns with field strain detected via a novel mark-free vision method. Structures 37:426\u2013441. https:\/\/doi.org\/10.1016\/j.istruc.2021.12.055","journal-title":"Structures"},{"issue":"3","key":"1622_CR18","doi-asserted-by":"publisher","first-page":"316","DOI":"10.1109\/TCE.2016.7613199","volume":"62","author":"J Kang","year":"2016","unstructured":"Kang J, Anderson DV, Hayes MH (2016) Face recognition for vehicle personalization with near infrared frame differencing. IEEE Trans Consum Electron 62(3):316\u2013324. https:\/\/doi.org\/10.1109\/TCE.2016.7613199","journal-title":"IEEE Trans Consum Electron"},{"key":"1622_CR19","doi-asserted-by":"publisher","DOI":"10.1016\/j.sigpro.2021.108007","volume":"183","author":"J Xu","year":"2021","unstructured":"Xu J, Lu K, Shi X, Qin S, Wang H, Ma J (2021) A denseunet generative adversarial network for near-infrared face image colorization. Signal Process 183:108007. https:\/\/doi.org\/10.1016\/j.sigpro.2021.108007","journal-title":"Signal Process"},{"key":"1622_CR20","doi-asserted-by":"crossref","unstructured":"Waxman AM, Gove AN, Siebert MC, Fay DA, Carrick JE, Racamato JP, Savoye ED, Burke BE, Reich RK, McGonagle WH, Craig DM (1996) Progress on color night vision: visible\/ir fusion, perception and search, and low-light ccd imaging. In: Defense, Security, and Sensing. https:\/\/api.semanticscholar.org\/CorpusID:122970219","DOI":"10.1117\/12.241025"},{"issue":"6","key":"1622_CR21","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3355089.3356561","volume":"38","author":"C Zou","year":"2019","unstructured":"Zou C, Mo H, Gao C, Du R, Fu H (2019) Language-based colorization of scene sketches. ACM Trans Graph 38(6):1\u201316. https:\/\/doi.org\/10.1145\/3355089.3356561","journal-title":"ACM Trans Graph"},{"key":"1622_CR22","doi-asserted-by":"publisher","DOI":"10.1016\/j.sigpro.2020.107616","volume":"174","author":"H Li","year":"2020","unstructured":"Li H, Li B, Tan S, Huang J (2020) Identification of deep network generated images using disparities in color components. Signal Process 174:107616. https:\/\/doi.org\/10.1016\/j.sigpro.2020.107616","journal-title":"Signal Process"},{"key":"1622_CR23","doi-asserted-by":"publisher","unstructured":"Dong X, Li W, Wang X, Wang Y (2019) Learning a deep convolutional network for colorization in monochrome-color dual-lens system. In: Proceedings of the Thirty-Third AAAI Conference on Artificial Intelligence and Thirty-First Innovative Applications of Artificial Intelligence Conference and Ninth AAAI Symposium on Educational Advances in Artificial Intelligence. AAAI\u201919\/IAAI\u201919\/EAAI\u201919. AAAI Press, ???. https:\/\/doi.org\/10.1609\/aaai.v33i01.33018255","DOI":"10.1609\/aaai.v33i01.33018255"},{"issue":"1","key":"1622_CR24","doi-asserted-by":"publisher","first-page":"502","DOI":"10.1109\/TPAMI.2020.3012548","volume":"44","author":"H Xu","year":"2022","unstructured":"Xu H, Ma J, Jiang J, Guo X, Ling H (2022) U2fusion: a unified unsupervised image fusion network. IEEE Trans Pattern Anal Mach Intell 44(1):502\u2013518. https:\/\/doi.org\/10.1109\/TPAMI.2020.3012548","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1622_CR25","doi-asserted-by":"publisher","first-page":"8","DOI":"10.1016\/j.infrared.2017.02.005","volume":"82","author":"J Ma","year":"2017","unstructured":"Ma J, Zhou Z, Wang B, Zong H (2017) Infrared and visible image fusion based on visual saliency map and weighted least square optimization. Infrared Phys Technol 82:8\u201317. https:\/\/doi.org\/10.1016\/j.infrared.2017.02.005","journal-title":"Infrared Phys Technol"},{"key":"1622_CR26","doi-asserted-by":"crossref","unstructured":"Jiang Q, Zhou T, He Y, Ma W, Hou J, Ghani ASA, Miao S, Jin X (2025) Cmmf-net: a generative network based on clip-guided multi-modal feature fusion for thermal infrared image colorization. Intell Robot 5(1). https:\/\/doi.org\/10.20517\/ir.2025.03","DOI":"10.20517\/ir.2025.03"},{"issue":"3","key":"1622_CR27","doi-asserted-by":"publisher","first-page":"662","DOI":"10.20517\/ir.2025.34","volume":"5","author":"X Chen","year":"2025","unstructured":"Chen X, Yang R, Wu Y, Zhang H, Ranjitkar P, Postolache O, Zheng Y, Wang Z (2025) Towards intelligent shipping: image-enhanced ship detection and situation analysis in low-light scenes. Intell Robot 5(3):662\u201378. https:\/\/doi.org\/10.20517\/ir.2025.34","journal-title":"Intell Robot"},{"key":"1622_CR28","unstructured":"Irony R, Cohen-Or D, Lischinski D (2005) Colorization by example. In: Proceedings of the Sixteenth Eurographics Conference on Rendering Techniques. EGSR \u201905, pp 201\u2013210. Eurographics Association, Goslar, DEU"},{"issue":"1145\/1409060","key":"1622_CR29","first-page":"1409105","volume":"10","author":"X Liu","year":"2008","unstructured":"Liu X, Wan L, Qu Y, Wong T-T, Lin S, Leung C-S, Heng P-A (2008) Intrinsic colorization. ACM Trans Graph doi 10(1145\/1409060):1409105","journal-title":"ACM Trans Graph doi"},{"key":"1622_CR30","doi-asserted-by":"publisher","first-page":"126","DOI":"10.1007\/978-3-540-88690-7_10","volume-title":"Computer vision - ECCV 2008","author":"G Charpiat","year":"2008","unstructured":"Charpiat G, Hofmann M, Sch\u00f6lkopf B (2008) Automatic image colorization via multimodal predictions. In: Forsyth D, Torr P, Zisserman A (eds) Computer vision - ECCV 2008. Springer, Berlin, pp 126\u2013139"},{"key":"1622_CR31","doi-asserted-by":"publisher","DOI":"10.1016\/j.infrared.2020.103338","volume":"107","author":"X Kuang","year":"2020","unstructured":"Kuang X, Zhu J, Sui X, Liu Y, Liu C, Chen Q, Gu G (2020) Thermal infrared colorization via conditional generative adversarial network. Infrared Phys Technol 107:103338. https:\/\/doi.org\/10.1016\/j.infrared.2020.103338","journal-title":"Infrared Phys Technol"},{"key":"1622_CR32","doi-asserted-by":"publisher","first-page":"111159","DOI":"10.1109\/ACCESS.2020.3000481","volume":"8","author":"F Cheng","year":"2020","unstructured":"Cheng F, Shi J, Yun L, Cao X, Zhang J (2020) From coarse to fine (fc2f): a new scheme of colorizing thermal infrared images. IEEE Access 8:111159\u2013111171. https:\/\/doi.org\/10.1109\/ACCESS.2020.3000481","journal-title":"IEEE Access"},{"issue":"9","key":"1622_CR33","doi-asserted-by":"publisher","first-page":"15808","DOI":"10.1109\/TITS.2022.3145476","volume":"23","author":"F Luo","year":"2022","unstructured":"Luo F, Li Y, Zeng G, Peng P, Wang G, Li Y (2022) Thermal infrared image colorization for nighttime driving scenes with top-down guided attention. IEEE Trans Intell Transp Syst 23(9):15808\u201315823. https:\/\/doi.org\/10.1109\/TITS.2022.3145476","journal-title":"IEEE Trans Intell Transp Syst"},{"issue":"4","key":"1622_CR34","doi-asserted-by":"publisher","first-page":"2954","DOI":"10.1109\/TIV.2022.3218833","volume":"8","author":"H Liao","year":"2023","unstructured":"Liao H, Jiang Q, Jin X, Liu L, Liu L, Lee S-J, Zhou W (2023) Mugan: thermal infrared image colorization using mixed-skipping unet and generative adversarial network. IEEE Trans Intell Veh 8(4):2954\u20132969. https:\/\/doi.org\/10.1109\/TIV.2022.3218833","journal-title":"IEEE Trans Intell Veh"},{"issue":"3","key":"1622_CR35","doi-asserted-by":"publisher","first-page":"478","DOI":"10.1109\/TCE.2023.3280165","volume":"69","author":"Y He","year":"2023","unstructured":"He Y, Jin X, Jiang Q, Cheng Z, Wang P, Zhou W (2023) Lkat-gan: A gan for thermal infrared image colorization based on large kernel and attentionunet-transformer. IEEE Trans Consum Electron 69(3):478\u2013489. https:\/\/doi.org\/10.1109\/TCE.2023.3280165","journal-title":"IEEE Trans Consum Electron"},{"key":"1622_CR36","doi-asserted-by":"publisher","DOI":"10.1016\/j.infrared.2024.105673","volume":"145","author":"Q Jiang","year":"2025","unstructured":"Jiang Q, Yao G, Feng M, Jin X, Miao S, Gao Y, Cheng X (2025) Mcu-gan: colorization method for infrared images based on multi-convolution fusion and generative adversarial network. Infrared Phys Technol 145:105673. https:\/\/doi.org\/10.1016\/j.infrared.2024.105673","journal-title":"Infrared Phys Technol"},{"issue":"3","key":"1622_CR37","doi-asserted-by":"publisher","first-page":"663","DOI":"10.3390\/rs15030663","volume":"15","author":"S Yang","year":"2023","unstructured":"Yang S, Sun M, Lou X, Yang H, Zhou H (2023) An unpaired thermal infrared image translation method using gma-cyclegan. Remote Sens 15(3):663. https:\/\/doi.org\/10.3390\/rs15030663","journal-title":"Remote Sens"},{"key":"1622_CR38","doi-asserted-by":"publisher","DOI":"10.1007\/s00371-025-04165-4","author":"G Yao","year":"2025","unstructured":"Yao G, Jin X, Jiang Q et al (2025) Ds-gan: a dual sub-structure gan for thermal infrared image colorization using u-net with convnext and multi-scale large kernel attention. Vis Comput. https:\/\/doi.org\/10.1007\/s00371-025-04165-4","journal-title":"Vis Comput"},{"key":"1622_CR39","doi-asserted-by":"crossref","unstructured":"Berg A, Ahlberg J, Felsberg M (2018) Generating visible spectrum images from thermal infrared. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshops","DOI":"10.1109\/CVPRW.2018.00159"},{"key":"1622_CR40","doi-asserted-by":"publisher","unstructured":"Lin T-Y, Doll\u00e1r P, Girshick R, He K, Hariharan B, Belongie S (2017) Feature pyramid networks for object detection. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp 936\u2013944. https:\/\/doi.org\/10.1109\/CVPR.2017.106","DOI":"10.1109\/CVPR.2017.106"},{"key":"1622_CR41","unstructured":"Denton EL, Chintala S, Fergus R et al (2015) Deep generative image models using a laplacian pyramid of adversarial networks. Adv Neural Inf Process Syst 28"},{"key":"1622_CR42","unstructured":"Karras T, Aila T, Laine S, Lehtinen J (2018) Progressive growing of GANs for improved quality, stability, and variation. In: International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=Hk99zCeAb"},{"key":"1622_CR43","doi-asserted-by":"crossref","unstructured":"Chen Q, Koltun V (2017) Photographic image synthesis with cascaded refinement networks. In: Proceedings of the IEEE International Conference on Computer Vision, pp 1511\u20131520","DOI":"10.1109\/ICCV.2017.168"},{"key":"1622_CR44","doi-asserted-by":"crossref","unstructured":"Ding X, Zhang X, Han J, Ding G (2022) Scaling up your kernels to 31x31: revisiting large kernel design in cnns. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 11963\u201311975","DOI":"10.1109\/CVPR52688.2022.01166"},{"key":"1622_CR45","unstructured":"Liu S, Chen T, Chen X, Chen X, Xiao Q, Wu B, K\u00e4rkk\u00e4inen T, Pechenizkiy M, Mocanu DC, Wang Z (2023) More convnets in the 2020s: scaling up kernels beyond 51x51 using sparsity. In: The Eleventh International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=bXNl-myZkJl"},{"issue":"4","key":"1622_CR46","doi-asserted-by":"publisher","first-page":"733","DOI":"10.1007\/s41095-023-0364-2","volume":"9","author":"M-H Guo","year":"2023","unstructured":"Guo M-H, Lu C-Z, Liu Z-N, Cheng M-M, Hu S-M (2023) Visual attention network. Comput Vis Media 9(4):733\u2013752","journal-title":"Comput Vis Media"},{"key":"1622_CR47","doi-asserted-by":"publisher","unstructured":"Wang X, Girshick R, Gupta A, He K (2018) Non-local neural networks. In: 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 7794\u20137803. https:\/\/doi.org\/10.1109\/CVPR.2018.00813","DOI":"10.1109\/CVPR.2018.00813"},{"key":"1622_CR48","doi-asserted-by":"crossref","unstructured":"Ke T-W, Hwang J-J, Liu Z, Yu SX (2018) Adaptive affinity fields for semantic segmentation. In: Proceedings of the European Conference on Computer Vision (ECCV), pp 587\u2013602","DOI":"10.1007\/978-3-030-01246-5_36"},{"issue":"6","key":"1622_CR49","doi-asserted-by":"publisher","first-page":"6896","DOI":"10.1109\/TPAMI.2020.3007032","volume":"45","author":"Z Huang","year":"2023","unstructured":"Huang Z, Wang X, Wei Y, Huang L, Shi H, Liu W, Huang TS (2023) Ccnet: Criss-cross attention for semantic segmentation. IEEE Trans Pattern Anal Mach Intell 45(6):6896\u20136908. https:\/\/doi.org\/10.1109\/TPAMI.2020.3007032","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1622_CR50","unstructured":"Gu A, Dao T (2024) Mamba: linear-time sequence modeling with selective state spaces. In: First Conference on Language Modeling"},{"key":"1622_CR51","first-page":"103031","volume":"37","author":"Y Liu","year":"2024","unstructured":"Liu Y, Tian Y, Zhao Y, Yu H, Xie L, Wang Y, Ye Q, Jiao J, Liu Y (2024) Vmamba: visual state space model. Adv Neural Inf Process Syst 37:103031\u2013103063","journal-title":"Adv Neural Inf Process Syst"},{"key":"1622_CR52","first-page":"578","volume-title":"Medical image computing and computer assisted intervention - MICCAI 2024","author":"Z Xing","year":"2024","unstructured":"Xing Z, Ye T, Yang Y, Liu G, Zhu L (2024) Segmamba: long-range sequential modeling mamba for 3d medical image segmentation. In: Linguraru MG, Dou Q, Feragen A, Giannarou S, Glocker B, Lekadir K, Schnabel JA (eds) Medical image computing and computer assisted intervention - MICCAI 2024. Springer, Cham, pp 578\u2013588"},{"key":"1622_CR53","doi-asserted-by":"crossref","unstructured":"Dang TDQ, Nguyen HH, Tiulpin A (2024) Log-vmamba: local-global vision mamba for medical image segmentation. In: Proceedings of the Asian Conference on Computer Vision, pp 548\u2013565","DOI":"10.1007\/978-981-96-0901-7_14"},{"key":"1622_CR54","doi-asserted-by":"publisher","unstructured":"Zhu J-Y, Park T, Isola P, Efros AA (2017) Unpaired image-to-image translation using cycle-consistent adversarial networks. In: 2017 IEEE International Conference on Computer Vision (ICCV), pp 2242\u20132251. https:\/\/doi.org\/10.1109\/ICCV.2017.244","DOI":"10.1109\/ICCV.2017.244"},{"key":"1622_CR55","doi-asserted-by":"publisher","unstructured":"Isola P, Zhu J-Y, Zhou T, Efros AA (2017) Image-to-image translation with conditional adversarial networks. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp 5967\u20135976. https:\/\/doi.org\/10.1109\/CVPR.2017.632","DOI":"10.1109\/CVPR.2017.632"},{"key":"1622_CR56","doi-asserted-by":"publisher","unstructured":"Hwang S, Park J, Kim N, Choi Y, Kweon IS (2015) Multispectral pedestrian detection: benchmark dataset and baseline. In: 2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp 1037\u20131045. https:\/\/doi.org\/10.1109\/CVPR.2015.7298706","DOI":"10.1109\/CVPR.2015.7298706"},{"key":"1622_CR57","doi-asserted-by":"publisher","unstructured":"Li S, Han B, Yu Z, Liu CH, Chen K, Wang S (2021) I2v-gan: unpaired infrared-to-visible video translation. In: Proceedings of the 29th ACM International Conference on Multimedia. MM \u201921, pp 3061\u20133069. Association for Computing Machinery, New York, NY, USA. https:\/\/doi.org\/10.1145\/3474085.3475445","DOI":"10.1145\/3474085.3475445"},{"key":"1622_CR58","unstructured":"Paszke A, Gross S, Massa F, Lerer A, Bradbury J, Chanan G, Killeen T, Lin Z, Gimelshein N, Antiga L et al (2019) Pytorch: an imperative style, high-performance deep learning library. Adv Neural Inf Process Syst 32"},{"key":"1622_CR59","unstructured":"Kingma DP, Ba J (2014) Adam: a method for stochastic optimization. arXiv preprint arXiv:1412.6980"},{"issue":"4","key":"1622_CR60","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1109\/TIP.2003.819861","volume":"13","author":"Z Wang","year":"2004","unstructured":"Wang Z, Bovik AC, Sheikh HR, Simoncelli EP (2004) Image quality assessment: from error visibility to structural similarity. IEEE Trans Image Process 13(4):600\u2013612","journal-title":"IEEE Trans Image Process"},{"key":"1622_CR61","unstructured":"Kodali N, Abernethy J, Hays J, Kira Z (2017) On convergence and stability of gans. arXiv preprint arXiv:1705.07215"},{"key":"1622_CR62","unstructured":"Odena A, Buckman J, Olsson C, Brown T, Olah C, Raffel C, Goodfellow I (2018) Is generator conditioning causally related to gan performance? In: International Conference on Machine Learning, pp 3849\u20133858. PMLR"}],"container-title":["Pattern Analysis and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-026-01622-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10044-026-01622-1","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-026-01622-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T10:39:08Z","timestamp":1773484748000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10044-026-01622-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,9]]},"references-count":62,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,3]]}},"alternative-id":["1622"],"URL":"https:\/\/doi.org\/10.1007\/s10044-026-01622-1","relation":{},"ISSN":["1433-7541","1433-755X"],"issn-type":[{"value":"1433-7541","type":"print"},{"value":"1433-755X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2,9]]},"assertion":[{"value":"4 November 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 February 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"46"}}