{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T19:34:45Z","timestamp":1776886485935,"version":"3.51.2"},"reference-count":98,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,12,27]],"date-time":"2025-12-27T00:00:00Z","timestamp":1766793600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,12,27]],"date-time":"2025-12-27T00:00:00Z","timestamp":1766793600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2026,1]]},"DOI":"10.1007\/s11263-025-02668-0","type":"journal-article","created":{"date-parts":[[2025,12,27]],"date-time":"2025-12-27T07:49:37Z","timestamp":1766821777000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":11,"title":["Contourlet Refinement Gate Framework for Thermal Spectrum Distribution Regularized Infrared Image Super-Resolution"],"prefix":"10.1007","volume":"134","author":[{"given":"Yang","family":"Zou","sequence":"first","affiliation":[]},{"given":"Zhixin","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Zhipeng","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Xingyuan","family":"Li","sequence":"additional","affiliation":[]},{"given":"Long","family":"Ma","sequence":"additional","affiliation":[]},{"given":"Jinyuan","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Peng","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Yanning","family":"Zhang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,12,27]]},"reference":[{"issue":"16","key":"2668_CR1","doi-asserted-by":"publisher","first-page":"25107","DOI":"10.1007\/s11042-023-14417-x","volume":"82","author":"J Alfred Daniel","year":"2023","unstructured":"Alfred Daniel, J., Chandru Vignesh, C., Muthu, B. A., Senthil Kumar, R., Sivaparthipan, C. B., & Marin, C. E. M. (2023). Fully convolutional neural networks for lidar-camera fusion for pedestrian detection in autonomous vehicle. Multimedia Tools and Applications, 82(16), 25107\u201325130.","journal-title":"Multimedia Tools and Applications"},{"key":"2668_CR2","doi-asserted-by":"crossref","unstructured":"Avrahami, O., Lischinski, D., & Fried, O. (2022). Blended diffusion for text-driven editing of natural images. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 18208\u201318218","DOI":"10.1109\/CVPR52688.2022.01767"},{"key":"2668_CR3","doi-asserted-by":"crossref","unstructured":"Brooks, T., Holynski, A., & Efros, A. A. (2023). Instructpix2pix: Learning to follow image editing instructions. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 18392\u201318402","DOI":"10.1109\/CVPR52729.2023.01764"},{"key":"2668_CR4","doi-asserted-by":"crossref","unstructured":"Cao, H., Wang, Y., Chen, J., Jiang, D., Zhang, X., Tian, Q., & Wang, M. (2022) Swin-unet: Unet-like pure transformer for medical image segmentation. In: Proceedings of the European Conference on Computer Vision, Springer, 205\u2013218","DOI":"10.1007\/978-3-031-25066-8_9"},{"issue":"3","key":"2668_CR5","first-page":"7","volume":"2","author":"J Cao","year":"2021","unstructured":"Cao, J., Li, Y., Zhang, K., & Van Gool, L. (2021). Video super-resolution transformer., 2(3), 7. arXiv:2106.06847.","journal-title":"Video super-resolution transformer."},{"key":"2668_CR6","doi-asserted-by":"crossref","unstructured":"Carion, N., Massa, F., Synnaeve, G., Usunier, N., Kirillov, A., & Zagoruyko, S. (2020) End-to-end object detection with transformers. In: Proceedings of the European Conference on Computer Vision, 213\u2013229","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"2668_CR7","doi-asserted-by":"crossref","unstructured":"Chen, H., Wang, Y., Guo, T. et al (2021a) Pre-trained image processing transformer. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 12299\u201312310","DOI":"10.1109\/CVPR46437.2021.01212"},{"key":"2668_CR8","doi-asserted-by":"crossref","unstructured":"Chen, J., Yu, W., Tian, X., et al. (2024). Mdbfusion: A visible and infrared image fusion framework capable for motion deblurring. In: Proceedings of the IEEE International Conference on Image Processing, pp 1019\u20131025","DOI":"10.1109\/ICIP51287.2024.10647563"},{"issue":"102","key":"2668_CR9","doi-asserted-by":"publisher","first-page":"520","DOI":"10.1016\/j.scs.2020.102520","volume":"66","author":"L Chen","year":"2021","unstructured":"Chen, L., Tang, R., Anisetti, M., et al. (2021). A lightweight iterative error reconstruction network for infrared image super-resolution in smart grid. Sustainable Cities and Society, 66(102), 520. https:\/\/doi.org\/10.1016\/j.scs.2020.102520","journal-title":"Sustainable Cities and Society"},{"key":"2668_CR10","unstructured":"Chen, X., Wang, X., & Zhang, W., et al. (2023a). Hat: Hybrid attention transformer for image restoration. arXiv:2309.05239"},{"key":"2668_CR11","doi-asserted-by":"crossref","unstructured":"Chen, X., Wang, X., & Zhou, J., et al. (2023b). Activating more pixels in image super-resolution transformer. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 22367\u201322377.","DOI":"10.1109\/CVPR52729.2023.02142"},{"key":"2668_CR12","unstructured":"Chen, Z., Zhang, Y., & Gu, J., et al. (2022). Cross aggregation transformer for image restoration. Advances in Neural Information Processing Systems 35:25478\u201325490."},{"key":"2668_CR13","doi-asserted-by":"crossref","unstructured":"Chen, Z., Zhang, Y., & Gu, J., et al. (2023c). Dual aggregation transformer for image super-resolution. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 12312\u201312321.","DOI":"10.1109\/ICCV51070.2023.01131"},{"issue":"12","key":"2668_CR14","doi-asserted-by":"publisher","first-page":"2091","DOI":"10.1109\/TIP.2005.859376","volume":"14","author":"MN Do","year":"2005","unstructured":"Do, M. N., & Vetterli, M. (2005). The contourlet transform: an efficient directional multiresolution image representation. IEEE Transactions on Image Processing, 14(12), 2091\u20132106.","journal-title":"IEEE Transactions on Image Processing"},{"key":"2668_CR15","doi-asserted-by":"crossref","unstructured":"Dong, C., Loy, C.C., & He, K., et al. (2014). Learning a deep convolutional network for image super-resolution. In: Proceedings of the European Conference on Computer Vision, pp 184\u2013199.","DOI":"10.1007\/978-3-319-10593-2_13"},{"issue":"2","key":"2668_CR16","doi-asserted-by":"publisher","first-page":"295","DOI":"10.1109\/TPAMI.2015.2439281","volume":"38","author":"C Dong","year":"2015","unstructured":"Dong, C., Loy, C. C., He, K., et al. (2015). Image super-resolution using deep convolutional networks. IEEE Transactions on Pattern Analysis and Machine Intelligence, 38(2), 295\u2013307.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2668_CR17","doi-asserted-by":"crossref","unstructured":"Dong, C., Loy, C.C., & Tang, X. (2016). Accelerating the super-resolution convolutional neural network. In: Proceedings of the European Conference on Computer Vision, Springer, pp 391\u2013407.","DOI":"10.1007\/978-3-319-46475-6_25"},{"key":"2668_CR18","unstructured":"Dosovitskiy, A., Beyer, L., & Kolesnikov, A., et al. (2020). An image is worth 16x16 words: Transformers for image recognition at scale. arXiv:2010.11929"},{"key":"2668_CR19","doi-asserted-by":"crossref","unstructured":"Fu, J., Liu, J., & Tian, H., et al. (2019). Dual attention network for scene segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 3146\u20133154.","DOI":"10.1109\/CVPR.2019.00326"},{"key":"2668_CR20","doi-asserted-by":"crossref","unstructured":"Gao, S., Liu, X., & Zeng, B., et al. (2023). Implicit diffusion models for continuous super-resolution. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 10021\u201310030.","DOI":"10.1109\/CVPR52729.2023.00966"},{"key":"2668_CR21","doi-asserted-by":"crossref","unstructured":"Glasner, D., Bagon, S., & Irani, M. (2009). Super-resolution from a single image. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 349\u2013356.","DOI":"10.1109\/ICCV.2009.5459271"},{"key":"2668_CR22","unstructured":"Hertz, A., Mokady, R., & Tenenbaum, J., et al. (2022). Prompt-to-prompt image editing with cross attention control. arXiv:2208.01626"},{"key":"2668_CR23","doi-asserted-by":"crossref","unstructured":"Hong, Y., Chang, Y., & Liang, J., et al. (2024). Light flickering guided reflection removal. International Journal of Computer Vision pp 1\u201321.","DOI":"10.1007\/s11263-024-02073-z"},{"key":"2668_CR24","doi-asserted-by":"publisher","first-page":"982","DOI":"10.1109\/LSP.2021.3077801","volume":"28","author":"Y Huang","year":"2021","unstructured":"Huang, Y., Jiang, Z., Lan, R., et al. (2021). Infrared image super-resolution via transfer learning and psrgan. IEEE Signal Processing Letters, 28, 982\u2013986.","journal-title":"IEEE Signal Processing Letters"},{"key":"2668_CR25","doi-asserted-by":"publisher","first-page":"982","DOI":"10.1109\/LSP.2021.3077801","volume":"28","author":"Y Huang","year":"2021","unstructured":"Huang, Y., Jiang, Z., Lan, R., et al. (2021). Infrared image super-resolution via transfer learning and psrgan. IEEE Signal Processing Letters, 28, 982\u2013986. https:\/\/doi.org\/10.1109\/LSP.2021.3077801","journal-title":"IEEE Signal Processing Letters"},{"key":"2668_CR26","unstructured":"Jia, C., Yang, Y., & Xia, Y., et al. (2021). Scaling up visual and vision-language representation learning with noisy text supervision. In: Proceedings of the International Conference on Machine Learning, pp 4904\u20134916."},{"key":"2668_CR27","doi-asserted-by":"crossref","unstructured":"Karras, T., Laine, S., & Aila, T. (2019). A style-based generator architecture for generative adversarial networks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 4401\u20134410.","DOI":"10.1109\/CVPR.2019.00453"},{"key":"2668_CR28","doi-asserted-by":"crossref","unstructured":"Kim, G., Kwon, T., & Ye, J.C. (2022). Diffusionclip: Text-guided diffusion models for robust image manipulation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 2426\u20132435.","DOI":"10.1109\/CVPR52688.2022.00246"},{"key":"2668_CR29","unstructured":"Kristan, M., Matas, J., & Leonardis, A., et al. (2015). The visual object tracking vot2015 challenge results. In: Proceedings of the IEEE International Conference on Computer Vision Workshops, pp 1\u201323."},{"issue":"8","key":"2668_CR30","doi-asserted-by":"publisher","first-page":"1243","DOI":"10.1109\/LGRS.2017.2704122","volume":"14","author":"S Lei","year":"2017","unstructured":"Lei, S., Shi, Z., & Zou, Z. (2017). Super-resolution for remote sensing images via local-global combined network. IEEE Geoscience and Remote Sensing Letters, 14(8), 1243\u20131247.","journal-title":"IEEE Geoscience and Remote Sensing Letters"},{"key":"2668_CR31","doi-asserted-by":"crossref","unstructured":"Li, G., Lv, J., & Tian, Y., et al. (2022a). Transformer-empowered multi-scale contextual matching and aggregation for multi-contrast mri super-resolution. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 20636\u201320645.","DOI":"10.1109\/CVPR52688.2022.01998"},{"key":"2668_CR32","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1016\/j.neucom.2022.01.029","volume":"479","author":"H Li","year":"2022","unstructured":"Li, H., Yang, Y., Chang, M., et al. (2022). Srdiff: Single image super-resolution with diffusion probabilistic models. Neurocomputing, 479, 47\u201359.","journal-title":"Neurocomputing"},{"key":"2668_CR33","unstructured":"Li, W., Zhou, K., & Qi, L., et al. (2020). Lapar: Linearly-assembled pixel-adaptive regression network for single image super-resolution and beyond. Advances in Neural Information Processing Systems 33:20343\u201320355."},{"key":"2668_CR34","unstructured":"Li, W., Lu, X., & Qian, S., et al. (2021). On efficient transformer-based image pre-training for low-level vision. arXiv:2112.10175"},{"key":"2668_CR35","doi-asserted-by":"crossref","unstructured":"Li, X., Liu, J., & Chen, Z., et al. (2024). Contourlet residual for prompt learning enhanced infrared image super-resolution. In: Proceedings of the European Conference on Computer Vision, pp 270\u2013288.","DOI":"10.1007\/978-3-031-72646-0_16"},{"key":"2668_CR36","doi-asserted-by":"crossref","unstructured":"Li, X., Wang, Z., & Zou, Y., et al. (2025). Difiisr: A diffusion model with gradient guidance for infrared image super-resolution. In: Proceedings of the Computer Vision and Pattern Recognition Conference, pp 7534\u20137544.","DOI":"10.1109\/CVPR52734.2025.00706"},{"key":"2668_CR37","doi-asserted-by":"crossref","unstructured":"Liang, J., Cao, J., & Sun, G., et al. (2021). Swinir: Image restoration using swin transformer. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 1833\u20131844.","DOI":"10.1109\/ICCVW54120.2021.00210"},{"key":"2668_CR38","doi-asserted-by":"crossref","unstructured":"Liang, J., Zeng, H., & Zhang, L. (2022a). Details or artifacts: A locally discriminative learning approach to realistic image super-resolution. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 5657\u20135666.","DOI":"10.1109\/CVPR52688.2022.00557"},{"key":"2668_CR39","doi-asserted-by":"crossref","unstructured":"Liang, J., Zeng, H., & Zhang, L. (2022b). Efficient and degradation-adaptive network for real-world image super-resolution. In: Proceedings of the European Conference on Computer Vision, Springer, pp 574\u2013591.","DOI":"10.1007\/978-3-031-19797-0_33"},{"key":"2668_CR40","doi-asserted-by":"crossref","unstructured":"Lim, B., Son, S., & Kim, H., et al. (2017). Enhanced deep residual networks for single image super-resolution. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops, pp 136\u2013144.","DOI":"10.1109\/CVPRW.2017.151"},{"key":"2668_CR41","doi-asserted-by":"crossref","unstructured":"Liu, J., Fan, X., & Huang, Z., et al. (2022). Target-aware dual adversarial learning and a multi-scenario multi-modality benchmark to fuse infrared and visible for object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 5802\u20135811.","DOI":"10.1109\/CVPR52688.2022.00571"},{"key":"2668_CR42","doi-asserted-by":"crossref","unstructured":"Liu, J., Liu, Z., & Wu, G., et al. (2023). Multi-interactive feature learning and a full-time multi-modality benchmark for image fusion and segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 8115\u20138124.","DOI":"10.1109\/ICCV51070.2023.00745"},{"key":"2668_CR43","doi-asserted-by":"crossref","unstructured":"Liu, J., Li, X., & Wang, Z., et al. (2024a). Promptfusion: Harmonized semantic prompt learning for infrared and visible image fusion. IEEE\/CAA Journal of Automatica Sinica.","DOI":"10.1109\/JAS.2024.124878"},{"issue":"5","key":"2668_CR44","doi-asserted-by":"publisher","first-page":"1748","DOI":"10.1007\/s11263-023-01952-1","volume":"132","author":"J Liu","year":"2024","unstructured":"Liu, J., Lin, R., Wu, G., et al. (2024). Coconet: Coupled contrastive learning network with multi-level feature ensemble for multi-modality image fusion. International Journal of Computer Vision, 132(5), 1748\u20131775.","journal-title":"International Journal of Computer Vision"},{"key":"2668_CR45","doi-asserted-by":"crossref","unstructured":"Liu, J., Wu, G., & Liu, Z., et al. (2024c). Infrared and visible image fusion: From data compatibility to task adaption. IEEE Transactions on Pattern Analysis and Machine Intelligence.","DOI":"10.1109\/TPAMI.2024.3521416"},{"key":"2668_CR46","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1007\/s11263-019-01247-4","volume":"128","author":"L Liu","year":"2020","unstructured":"Liu, L., Ouyang, W., Wang, X., et al. (2020). Deep learning for generic object detection: A survey. International Journal of Computer Vision, 128, 261\u2013318.","journal-title":"International Journal of Computer Vision"},{"issue":"6","key":"2668_CR47","doi-asserted-by":"publisher","first-page":"2636","DOI":"10.1109\/TNNLS.2020.3007412","volume":"32","author":"M Liu","year":"2020","unstructured":"Liu, M., Jiao, L., Liu, X., et al. (2020). C-cnn: Contourlet convolutional neural networks. IEEE Transactions on Neural Networks and Learning Systems, 32(6), 2636\u20132649.","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"2668_CR48","unstructured":"Liu, Y., Sun, G., & Qiu, Y., et al. (2021a). Transformer in convolutional neural networks. 3. arXiv:2106.03180"},{"key":"2668_CR49","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., & Cao, Y., et al. (2021b). Swin transformer: Hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 10012\u201310022.","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"2668_CR50","doi-asserted-by":"crossref","unstructured":"Lugmayr, A., Danelljan, M., & Romero, A., et al. (2022). Repaint: Inpainting using denoising diffusion probabilistic models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 11461\u201311471.","DOI":"10.1109\/CVPR52688.2022.01117"},{"key":"2668_CR51","doi-asserted-by":"publisher","first-page":"153","DOI":"10.1016\/j.inffus.2018.02.004","volume":"45","author":"J Ma","year":"2019","unstructured":"Ma, J., Ma, Y., & Li, C. (2019). Infrared and visible image fusion methods and applications: A survey. Information Fusion, 45, 153\u2013178.","journal-title":"Information Fusion"},{"key":"2668_CR52","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1016\/j.inffus.2018.09.004","volume":"48","author":"J Ma","year":"2019","unstructured":"Ma, J., Yu, W., Liang, P., et al. (2019). Fusiongan: A generative adversarial network for infrared and visible image fusion. Information Fusion, 48, 11\u201326.","journal-title":"Information Fusion"},{"key":"2668_CR53","doi-asserted-by":"publisher","first-page":"512","DOI":"10.1007\/s11263-018-1117-z","volume":"127","author":"J Ma","year":"2019","unstructured":"Ma, J., Zhao, J., Jiang, J., et al. (2019). Locality preserving matching. International Journal of Computer Vision, 127, 512\u2013531.","journal-title":"International Journal of Computer Vision"},{"issue":"1","key":"2668_CR54","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1007\/s11263-020-01359-2","volume":"129","author":"J Ma","year":"2021","unstructured":"Ma, J., Jiang, X., Fan, A., et al. (2021). Image matching from handcrafted to deep features: A survey. International Journal of Computer Vision, 129(1), 23\u201379.","journal-title":"International Journal of Computer Vision"},{"key":"2668_CR55","unstructured":"Ma, L., Jin, D., & An, N., et al. (2023). Bilevel fast scene adaptation for low-light image enhancement. International Journal of Computer Vision 1\u201319"},{"key":"2668_CR56","doi-asserted-by":"crossref","unstructured":"Marivani, I., Tsiligianni, E., & Cornelis, B., et al. (2020). Joint image super-resolution via recurrent convolutional neural networks with coupled sparse priors. In: Proceedings of the IEEE International Conference on Image Processing, pp 868\u2013872","DOI":"10.1109\/ICIP40778.2020.9190644"},{"key":"2668_CR57","doi-asserted-by":"crossref","unstructured":"Mei, Y., Fan, Y., & Zhou, Y. (2021). Image super-resolution with non-local sparse attention. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 3517\u20133526","DOI":"10.1109\/CVPR46437.2021.00352"},{"issue":"130","key":"2668_CR58","first-page":"200","volume":"639","author":"Z Meng","year":"2025","unstructured":"Meng, Z., Han, K., He, Y., et al. (2025). Modeling detail feature connections for infrared image enhancement. Neurocomputing, 639(130), 200.","journal-title":"Neurocomputing"},{"key":"2668_CR59","doi-asserted-by":"crossref","unstructured":"Patashnik, O., Wu, Z., & Shechtman, E., et al. (2021). Styleclip: Text-driven manipulation of stylegan imagery. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 2085\u20132094","DOI":"10.1109\/ICCV48922.2021.00209"},{"issue":"7","key":"2668_CR60","doi-asserted-by":"publisher","first-page":"073101","DOI":"10.1117\/1.OE.60.7.073101","volume":"60","author":"H Patel","year":"2021","unstructured":"Patel, H., Chudasama, V., Prajapati, K., et al. (2021). Thermisrnet: an efficient thermal image super-resolution network. Optical Engineering, 60(7), 073101\u2013073101.","journal-title":"Optical Engineering"},{"key":"2668_CR61","doi-asserted-by":"crossref","unstructured":"Pu, M., Huang, Y., & Guan, Q., et al. (2018). Graphnet: Learning image pseudo annotations for weakly-supervised semantic segmentation. In: Proceedings of the 26th ACM International Conference on Multimedia, pp 483\u2013491","DOI":"10.1145\/3240508.3240542"},{"key":"2668_CR62","unstructured":"Radford, A., Kim, J.W., & Hallacy, C., et al. (2021). Learning transferable visual models from natural language supervision. In: Proceedings of the International Conference on Machine Learning, pp 8748\u20138763"},{"issue":"2","key":"2668_CR63","first-page":"3","volume":"1","author":"A Ramesh","year":"2022","unstructured":"Ramesh, A., Dhariwal, P., Nichol, A., et al. (2022). Hierarchical text-conditional image generation with clip latents., 1(2), 3. arXiv:2204.06125.","journal-title":"Hierarchical text-conditional image generation with clip latents."},{"key":"2668_CR64","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., & Lorenz, D., et al. (2022). High-resolution image synthesis with latent diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 10,684\u201310,695","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"2668_CR65","first-page":"36479","volume":"35","author":"C Saharia","year":"2022","unstructured":"Saharia, C., Chan, W., Saxena, S., et al. (2022). Photorealistic text-to-image diffusion models with deep language understanding. Advances in Neural Information Processing Systems, 35, 36479\u201336494.","journal-title":"Advances in Neural Information Processing Systems"},{"issue":"4","key":"2668_CR66","first-page":"4713","volume":"45","author":"C Saharia","year":"2022","unstructured":"Saharia, C., Ho, J., Chan, W., et al. (2022). Image super-resolution via iterative refinement. IEEE Transactions on Pattern Analysis and Machine Intelligence, 45(4), 4713\u20134726.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2668_CR67","doi-asserted-by":"publisher","first-page":"23815","DOI":"10.1007\/s11042-018-5915-7","volume":"78","author":"P Shamsolmoali","year":"2019","unstructured":"Shamsolmoali, P., Zareapoor, M., Jain, D. K., et al. (2019). Deep convolution network for surveillance records super-resolution. Multimedia Tools and Applications, 78, 23815\u201323829.","journal-title":"Multimedia Tools and Applications"},{"key":"2668_CR68","doi-asserted-by":"crossref","unstructured":"Shi, W., Caballero, J., & Husz\u00e1r, F., et al. (2016). Real-time single image and video super-resolution using an efficient sub-pixel convolutional neural network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 1874\u20131883","DOI":"10.1109\/CVPR.2016.207"},{"key":"2668_CR69","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1016\/j.dib.2017.09.038","volume":"15","author":"A Toet","year":"2017","unstructured":"Toet, A. (2017). The tno multiband image data collection. Data in Brief, 15, 249\u2013251.","journal-title":"Data in Brief"},{"key":"2668_CR70","unstructured":"Touvron, H., Cord, M., Douze, M., et al. (2021). Training data-efficient image transformers & distillation through attention. Proceedings of the International Conference on Machine Learning, 10347\u201310357."},{"key":"2668_CR71","doi-asserted-by":"crossref","unstructured":"Vaswani, A., Ramachandran, P., Srinivas, A., et al. (2021). Scaling local self-attention for parameter efficient visual backbones. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 12894\u201312904.","DOI":"10.1109\/CVPR46437.2021.01270"},{"key":"2668_CR72","first-page":"2","volume":"1","author":"X Wang","year":"2022","unstructured":"Wang, X., Xie, L., Dong, C., et al. (2022). Realesrgan: Training real-world blind super-resolution with pure synthetic data supplementary material. Computer Vision Foundation Open Access, 1, 2.","journal-title":"Computer Vision Foundation Open Access"},{"key":"2668_CR73","doi-asserted-by":"crossref","unstructured":"Wang, Y., Liu, Y., Zhao, S., et al. (2024). Camixersr: Only details need more\" attention\". Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 25837\u201325846.","DOI":"10.1109\/CVPR52733.2024.02441"},{"key":"2668_CR74","doi-asserted-by":"crossref","unstructured":"Wang, Y., Yang, W., Chen, X., et al. (2024). Sinsr: diffusion-based image super-resolution in a single step. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 25796\u201325805.","DOI":"10.1109\/CVPR52733.2024.02437"},{"issue":"4","key":"2668_CR75","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1109\/TIP.2003.819861","volume":"13","author":"Z Wang","year":"2004","unstructured":"Wang, Z., Bovik, A. C., Sheikh, H. R., et al. (2004). Image quality assessment: from error visibility to structural similarity. IEEE Transactions on Image Processing, 13(4), 600\u2013612.","journal-title":"IEEE Transactions on Image Processing"},{"key":"2668_CR76","doi-asserted-by":"crossref","unstructured":"Whang, J., Delbracio, M., Talebi, H., et al. (2022). Deblurring via stochastic refinement. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 16293\u201316303.","DOI":"10.1109\/CVPR52688.2022.01581"},{"key":"2668_CR77","unstructured":"Wu, B., Xu, C., & Dai, X., et al. (2020). Visual transformers: Token-based image representation and processing for computer vision. arXiv:2006.03677"},{"key":"2668_CR78","unstructured":"Wu, R., Sun, L., & Ma, Z., et al. (2024). One-step effective diffusion network for real-world image super-resolution. arXiv:2406.08177"},{"key":"2668_CR79","doi-asserted-by":"crossref","unstructured":"Wu, Y., Lim, J., & Yang, M. H. (2013). Online object tracking: A benchmark. Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2411\u20132418.","DOI":"10.1109\/CVPR.2013.312"},{"key":"2668_CR80","doi-asserted-by":"crossref","unstructured":"Xia, B., Zhang, Y., Wang, S., et al. (2023). Diffir: Efficient diffusion model for image restoration. Proceedings of the IEEE\/CVF International Conference on Computer Vision, 13095\u201313105.","DOI":"10.1109\/ICCV51070.2023.01204"},{"issue":"1","key":"2668_CR81","doi-asserted-by":"publisher","first-page":"4272","DOI":"10.1038\/s41598-024-52370-3","volume":"14","author":"H Xiao","year":"2024","unstructured":"Xiao, H., Wang, X., Wang, J., et al. (2024). Single image super-resolution with denoising diffusion gans. Scientific Reports, 14(1), 4272.","journal-title":"Scientific Reports"},{"key":"2668_CR82","first-page":"12077","volume":"34","author":"E Xie","year":"2021","unstructured":"Xie, E., Wang, W., Yu, Z., et al. (2021). Segformer: Simple and efficient design for semantic segmentation with transformers. Advances in Neural Information Processing Systems, 34, 12077\u201312090.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2668_CR83","doi-asserted-by":"crossref","unstructured":"Xie, L., Wang, X., Chen, X., et al. (2023). Desra: detect and delete the artifacts of gan-based real-world super-resolution models. arXiv:2307.02457","DOI":"10.1609\/aaai.v37i3.25398"},{"issue":"1","key":"2668_CR84","doi-asserted-by":"publisher","first-page":"502","DOI":"10.1109\/TPAMI.2020.3012548","volume":"44","author":"H Xu","year":"2020","unstructured":"Xu, H., Ma, J., Jiang, J., et al. (2020). U2fusion: A unified unsupervised image fusion network. IEEE Transactions on Pattern Analysis and Machine Intelligence, 44(1), 502-518.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2668_CR85","doi-asserted-by":"crossref","unstructured":"Yang, D., Li, Z., Xia, Y., et al. (2015). Remote sensing image super-resolution: Challenges and approaches. Proceedings of the IEEE International Conference on Digital Signal Processing, 196\u2013200.","DOI":"10.1109\/ICDSP.2015.7251858"},{"key":"2668_CR86","doi-asserted-by":"publisher","first-page":"158690","DOI":"10.1109\/ACCESS.2020.3017819","volume":"8","author":"Y Yang","year":"2020","unstructured":"Yang, Y., Li, Q., Yang, C., et al. (2020). Deep networks with detail enhancement for infrared image super-resolution. IEEE Access, 8, 158690\u2013158701.","journal-title":"IEEE Access"},{"key":"2668_CR87","unstructured":"Yao, L., Huang, R., & Hou, L., et al. (2021). Filip: Fine-grained interactive language-image pre-training. arXiv:2111.07783"},{"key":"2668_CR88","doi-asserted-by":"crossref","unstructured":"Yilmaz, A., Javed, O., & Shah, M. (2006). Object tracking: A survey. ACM Computing Surveys (CSUR) 38(4):13\u2013es","DOI":"10.1145\/1177352.1177355"},{"key":"2668_CR89","unstructured":"Yue, Z., Wang, J., & Loy, C.C. (2024). Resshift: Efficient diffusion model for image super-resolution by residual shifting. Advances in Neural Information Processing Systems 36"},{"key":"2668_CR90","doi-asserted-by":"crossref","unstructured":"Zamir, S.W., Arora, A., & Khan, S., et al. (2022). Restormer: Efficient transformer for high-resolution image restoration. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 5728\u20135739","DOI":"10.1109\/CVPR52688.2022.00564"},{"key":"2668_CR91","unstructured":"Zhang, J., Zhang, Y., & Gu, J., et al. (2022a). Accurate image restoration with attention retractable transformer. arXiv:2210.01427"},{"key":"2668_CR92","doi-asserted-by":"crossref","unstructured":"Zhang, K., Liang, J., Van Gool, L., et al. (2021). Designing a practical degradation model for deep blind image super-resolution. Proceedings of the IEEE\/CVF International Conference on Computer Vision, 4791\u20134800.","DOI":"10.1109\/ICCV48922.2021.00477"},{"key":"2668_CR93","doi-asserted-by":"crossref","unstructured":"Zhang, X., Zeng, H., Guo, S., et al. (2022). Efficient long-range attention network for image super-resolution. Proceedings of the European Conference on Computer Vision, Springer, 649\u2013667.","DOI":"10.1007\/978-3-031-19790-1_39"},{"key":"2668_CR94","doi-asserted-by":"publisher","first-page":"1013","DOI":"10.1007\/s11263-020-01407-x","volume":"129","author":"Y Zhang","year":"2021","unstructured":"Zhang, Y., Guo, X., Ma, J., et al. (2021). Beyond brightening low-light images. International Journal of Computer Vision, 129, 1013\u20131037.","journal-title":"International Journal of Computer Vision"},{"key":"2668_CR95","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Li, K., Li, K., et al. (2021). Mr image super-resolution with squeeze and excitation reasoning attention network. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 13425\u201313434.","DOI":"10.1109\/CVPR46437.2021.01322"},{"issue":"3","key":"2668_CR96","doi-asserted-by":"publisher","first-page":"1186","DOI":"10.1109\/TCSVT.2021.3075745","volume":"32","author":"Z Zhao","year":"2021","unstructured":"Zhao, Z., Xu, S., Zhang, J., et al. (2021). Efficient and model-based infrared and visible image fusion via algorithm unrolling. IEEE Transactions on Circuits and Systems for Video Technology, 32(3), 1186\u20131196.","journal-title":"IEEE Transactions on Circuits and Systems for Video Technology"},{"key":"2668_CR97","doi-asserted-by":"crossref","unstructured":"Zheng, S., Lu, J., Zhao, H., et al. (2021). Rethinking semantic segmentation from a sequence-to-sequence perspective with transformers. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 6881\u20136890.","DOI":"10.1109\/CVPR46437.2021.00681"},{"key":"2668_CR98","doi-asserted-by":"crossref","unstructured":"Zou, Y., Zhang, L., Chen, Q., et al. (2020). An infrared image super-resolution imaging algorithm based on auxiliary convolution neural network. Proceedings of the Optics Imaging and Display, 335\u2013340.","DOI":"10.1117\/12.2581217"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02668-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-025-02668-0","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02668-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,20]],"date-time":"2026-02-20T15:44:12Z","timestamp":1771602252000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-025-02668-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,27]]},"references-count":98,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,1]]}},"alternative-id":["2668"],"URL":"https:\/\/doi.org\/10.1007\/s11263-025-02668-0","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,12,27]]},"assertion":[{"value":"8 November 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 September 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 December 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"23"}}