{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,26]],"date-time":"2026-03-26T03:24:27Z","timestamp":1774495467964,"version":"3.50.1"},"reference-count":76,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2025,1,11]],"date-time":"2025-01-11T00:00:00Z","timestamp":1736553600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,11]],"date-time":"2025-01-11T00:00:00Z","timestamp":1736553600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Research Start-up Funds of Sichuan Agricultural University","award":["031-2222996009"],"award-info":[{"award-number":["031-2222996009"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Machine Vision and Applications"],"published-print":{"date-parts":[[2025,3]]},"DOI":"10.1007\/s00138-024-01658-5","type":"journal-article","created":{"date-parts":[[2025,1,11]],"date-time":"2025-01-11T07:29:55Z","timestamp":1736580595000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Ipdm: identity preserving diffusion model for face sketch and photo 
synthesis"],"prefix":"10.1007","volume":"36","author":[{"given":"Duoxun","family":"Tang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xinhang","family":"Jiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ying","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yuhang","family":"Dai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ye","family":"Lin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,1,11]]},"reference":[{"issue":"1","key":"1658_CR1","doi-asserted-by":"publisher","first-page":"50","DOI":"10.1109\/TCSVT.2003.818353","volume":"14","author":"X Tang","year":"2004","unstructured":"Tang, X., Wang, X.: Face sketch recognition. IEEE Trans. Circuits Syst. Video Technol. 14(1), 50\u201357 (2004)","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"issue":"11","key":"1658_CR2","doi-asserted-by":"publisher","first-page":"1955","DOI":"10.1109\/TPAMI.2008.222","volume":"31","author":"X Wang","year":"2008","unstructured":"Wang, X., Tang, X.: Face photo-sketch synthesis and recognition. IEEE Trans. Pattern Anal. Mach. Intell. 31(11), 1955\u20131967 (2008)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1658_CR3","doi-asserted-by":"publisher","first-page":"9","DOI":"10.1007\/s11263-013-0645-9","volume":"106","author":"N Wang","year":"2014","unstructured":"Wang, N., Tao, D., Gao, X., Li, X., Li, J.: A comprehensive survey to face hallucination. Int. J. Comput. Vision 106, 9\u201330 (2014)","journal-title":"Int. J. Comput. 
Vision"},{"issue":"5","key":"1658_CR4","doi-asserted-by":"publisher","first-page":"1419","DOI":"10.1109\/TNNLS.2018.2869574","volume":"30","author":"S Zhang","year":"2018","unstructured":"Zhang, S., Ji, R., Hu, J., Lu, X., Li, X.: Face sketch synthesis by multidomain adversarial learning. IEEE Trans. Neural Netw. Learn. Syst. 30(5), 1419\u20131428 (2018)","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"issue":"12","key":"1658_CR5","doi-asserted-by":"publisher","first-page":"15946","DOI":"10.1007\/s10489-022-04352-z","volume":"53","author":"W Wan","year":"2023","unstructured":"Wan, W., Yang, Y., Huang, S., Gan, L.: Fran: feature-filtered residual attention network for realistic face sketch-to-photo transformation. Appl. Intell. 53(12), 15946\u201315956 (2023). https:\/\/doi.org\/10.1007\/s10489-022-04352-z","journal-title":"Appl. Intell."},{"issue":"4","key":"1658_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2461912.2461964","volume":"32","author":"I Berger","year":"2013","unstructured":"Berger, I., Shamir, A., Mahler, M., Carter, E., Hodgins, J.: Style and abstraction in portrait sketching. ACM Trans. Graphics (TOG) 32(4), 1\u201312 (2013)","journal-title":"ACM Trans. Graphics (TOG)"},{"issue":"3","key":"1658_CR7","doi-asserted-by":"publisher","first-page":"904","DOI":"10.1109\/TCYB.2017.2664499","volume":"48","author":"M Zhang","year":"2017","unstructured":"Zhang, M., Li, J., Wang, N., Gao, X.: Compositional model-based sketch generator in facial entertainment. IEEE Trans. Cybern. 48(3), 904\u2013915 (2017)","journal-title":"IEEE Trans. Cybern."},{"issue":"6","key":"1658_CR8","first-page":"2701","volume":"50","author":"M Zhang","year":"2020","unstructured":"Zhang, M., Wang, N., Li, Y., Gao, X.: Bionic Face Sketch Generator. IEEE Trans. Syst. Man Cybern. 50(6), 2701\u20132714 (2020)","journal-title":"IEEE Trans. Syst. 
Man Cybern."},{"key":"1658_CR9","doi-asserted-by":"publisher","first-page":"8519","DOI":"10.1109\/TIP.2020.3016502","volume":"29","author":"C Peng","year":"2020","unstructured":"Peng, C., Wang, N., Li, J., Gao, X.: Universal face photo-sketch style transfer via multiview domain translation. IEEE Trans. Image Process. 29, 8519\u20138534 (2020)","journal-title":"IEEE Trans. Image Process."},{"issue":"1","key":"1658_CR10","doi-asserted-by":"publisher","first-page":"327","DOI":"10.1109\/TII.2021.3074989","volume":"18","author":"Y Lin","year":"2021","unstructured":"Lin, Y., Fu, K., Ling, S., Wang, J., Cheng, P.: Toward identity preserving face synthesis between sketches and photos using deep feature injection. IEEE Trans. Ind. Inf. 18(1), 327\u2013336 (2021)","journal-title":"IEEE Trans. Ind. Inf."},{"key":"1658_CR11","doi-asserted-by":"publisher","first-page":"1095","DOI":"10.1109\/LSP.2020.3005039","volume":"27","author":"Y Lin","year":"2020","unstructured":"Lin, Y., Ling, S., Fu, K., Cheng, P.: An identity-preserved model for face sketch-photo synthesis. IEEE Signal Process. Lett. 27, 1095\u20131099 (2020)","journal-title":"IEEE Signal Process. Lett."},{"key":"1658_CR12","doi-asserted-by":"crossref","unstructured":"Song, Y., Bao, L., Yang, Q., Yang, M.-H.: Real-time exemplar-based face sketch synthesis. In: Computer Vision\u2013ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6-12, 2014, Proceedings, Part VI 13, pp. 800\u2013813. Springer (2014)","DOI":"10.1007\/978-3-319-10599-4_51"},{"key":"1658_CR13","doi-asserted-by":"crossref","unstructured":"Zhang, W., Wang, X., Tang, X.: Lighting and pose robust face sketch synthesis. In: Computer Vision\u2013ECCV 2010: 11th European Conference on Computer Vision, Heraklion, Crete, Greece, September 5-11, 2010, Proceedings, Part VI 11, pp. 420\u2013433 (2010). 
Springer","DOI":"10.1007\/978-3-642-15567-3_31"},{"key":"1658_CR14","doi-asserted-by":"crossref","unstructured":"Zhou, H., Kuang, Z., Wong, K.-Y.K.: Markov weight fields for face sketch synthesis. In: 2012 IEEE Conference on Computer Vision and Pattern Recognition, pp. 1091\u20131097. IEEE (2012)","DOI":"10.1109\/CVPR.2012.6247788"},{"key":"1658_CR15","doi-asserted-by":"crossref","unstructured":"Wang, L., Sindagi, V., Patel, V.: High-quality facial photo-sketch synthesis using multi-adversarial networks. In: 2018 13th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2018), pp. 83\u201390. IEEE (2018)","DOI":"10.1109\/FG.2018.00022"},{"issue":"10","key":"1658_CR16","doi-asserted-by":"publisher","first-page":"3096","DOI":"10.1109\/TNNLS.2018.2890018","volume":"30","author":"M Zhu","year":"2019","unstructured":"Zhu, M., Li, J., Wang, N., Gao, X.: A deep collaborative framework for face photo-sketch synthesis. IEEE Trans. Neural Netw. Learn. Syst. 30(10), 3096\u20133108 (2019)","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"issue":"7","key":"1658_CR17","doi-asserted-by":"publisher","first-page":"2623","DOI":"10.1109\/TNNLS.2019.2933590","volume":"31","author":"M Zhang","year":"2020","unstructured":"Zhang, M., Wang, N., Li, Y., Gao, X.: Neural probabilistic graphical model for face sketch synthesis. IEEE Trans. Neural Netw. Learn. Syst. 31(7), 2623\u20132637 (2020). https:\/\/doi.org\/10.1109\/TNNLS.2019.2933590","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"1658_CR18","unstructured":"Goodfellow, I., Pouget-Abadie, J., Mirza, M., Xu, B., Warde-Farley, D., Ozair, S., Courville, A., Bengio, Y.: Generative adversarial nets. Adv. Neural Inf. Process. Syst. 27 (2014)"},{"key":"1658_CR19","doi-asserted-by":"crossref","unstructured":"Isola, P., Zhu, J.-Y., Zhou, T., Efros, A.A.: Image-to-image translation with conditional adversarial networks. 
In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1125\u20131134 (2017)","DOI":"10.1109\/CVPR.2017.632"},{"key":"1658_CR20","unstructured":"Sohl-Dickstein, J., Weiss, E.A., Maheswaranathan, N., Ganguli, S.: Deep unsupervised learning using nonequilibrium thermodynamics. JMLR.org (2015)"},{"key":"1658_CR21","first-page":"6840","volume":"33","author":"J Ho","year":"2020","unstructured":"Ho, J., Jain, A., Abbeel, P.: Denoising diffusion probabilistic models. Adv. Neural Inf. Process. Syst. 33, 6840\u20136851 (2020)","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"1658_CR22","unstructured":"Song, J., Meng, C., Ermon, S.: Denoising diffusion implicit models. arXiv preprint arXiv:2010.02502 (2020)"},{"key":"1658_CR23","unstructured":"Nichol, A.Q., Dhariwal, P.: Improved denoising diffusion probabilistic models. In: International Conference on Machine Learning, pp. 8162\u20138171. PMLR (2021)"},{"key":"1658_CR24","first-page":"8780","volume":"34","author":"P Dhariwal","year":"2021","unstructured":"Dhariwal, P., Nichol, A.: Diffusion models beat gans on image synthesis. Adv. Neural. Inf. Process. Syst. 34, 8780\u20138794 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"1658_CR25","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., Ommer, B.: High-resolution image synthesis with latent diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10684\u201310695 (2022)","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"1658_CR26","doi-asserted-by":"crossref","unstructured":"Saharia, C., Chan, W., Chang, H., Lee, C., Ho, J., Salimans, T., Fleet, D., Norouzi, M.: Palette: Image-to-image diffusion models. In: ACM SIGGRAPH 2022 Conference Proceedings, pp. 
1\u201310 (2022)","DOI":"10.1145\/3528233.3530757"},{"key":"1658_CR27","doi-asserted-by":"crossref","unstructured":"Liu, Q., Tang, X., Jin, H., Lu, H., Ma, S.: A nonlinear approach for face sketch synthesis and recognition. In: 2005 IEEE Computer Society Conference on Computer Vision and Pattern Recognition (CVPR\u201905), vol. 1, pp. 1005\u20131010. IEEE (2005)","DOI":"10.1109\/CVPR.2005.39"},{"issue":"4","key":"1658_CR28","doi-asserted-by":"publisher","first-page":"487","DOI":"10.1109\/TCSVT.2008.918770","volume":"18","author":"X Gao","year":"2008","unstructured":"Gao, X., Zhong, J., Li, J., Tian, C.: Face sketch synthesis algorithm based on e-hmm and selective ensemble. IEEE Trans. Circuits Syst. Video Technol. 18(4), 487\u2013496 (2008)","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"key":"1658_CR29","doi-asserted-by":"crossref","unstructured":"Zhang, J., Wang, N., Gao, X., Tao, D., Li, X.: Face sketch-photo synthesis based on support vector regression. In: 2011 18th IEEE International Conference on Image Processing, pp. 1125\u20131128. IEEE (2011)","DOI":"10.1109\/ICIP.2011.6115625"},{"key":"1658_CR30","doi-asserted-by":"crossref","unstructured":"Ji, N., Chai, X., Shan, S., Chen, X.: Local regression model for automatic face sketch generation. In: 2011 Sixth International Conference on Image and Graphics, pp. 412\u2013417. IEEE (2011)","DOI":"10.1109\/ICIG.2011.84"},{"issue":"6","key":"1658_CR31","doi-asserted-by":"publisher","first-page":"7900","DOI":"10.1109\/TPAMI.2022.3217852","volume":"45","author":"H Ding","year":"2022","unstructured":"Ding, H., Liu, C., Wang, S., Jiang, X.: Vlt: vision-language transformer and query generation for referring segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 45(6), 7900\u20137916 (2022)","journal-title":"IEEE Trans. Pattern Anal. Mach. 
Intell."},{"key":"1658_CR32","doi-asserted-by":"crossref","unstructured":"Ding, H., Liu, C., He, S., Jiang, X., Torr, P.H., Bai, S.: Mose: A new dataset for video object segmentation in complex scenes. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 20224\u201320234 (2023)","DOI":"10.1109\/ICCV51070.2023.01850"},{"key":"1658_CR33","doi-asserted-by":"crossref","unstructured":"Liu, C., Ding, H., Jiang, X.: Gres: Generalized referring expression segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 23592\u201323601 (2023)","DOI":"10.1109\/CVPR52729.2023.02259"},{"key":"1658_CR34","doi-asserted-by":"crossref","unstructured":"Ding, H., Liu, C., He, S., Jiang, X., Loy, C.C.: Mevis: A large-scale benchmark for video segmentation with motion expressions. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 2694\u20132703 (2023)","DOI":"10.1109\/ICCV51070.2023.00254"},{"key":"1658_CR35","doi-asserted-by":"crossref","unstructured":"Li, X., Ding, H., Yuan, H., Zhang, W., Pang, J., Cheng, G., Chen, K., Liu, Z., Loy, C.C.: Transformer-based visual segmentation: a survey. IEEE Trans Pattern Anal. Mach. Intell. (2024)","DOI":"10.1109\/TPAMI.2024.3434373"},{"key":"1658_CR36","doi-asserted-by":"crossref","unstructured":"Wu, J., Li, X., Xu, S., Yuan, H., Ding, H., Yang, Y., Li, X., Zhang, J., Tong, Y., Jiang, X., et al.: Towards open vocabulary learning: a survey. IEEE Trans. Pattern Anal. Mach. Intell. (2024)","DOI":"10.1109\/TPAMI.2024.3361862"},{"key":"1658_CR37","doi-asserted-by":"crossref","unstructured":"Liu, C., Li, X., Ding, H.: Referring image editing: Object-level image editing via referring expressions. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 
13128\u201313138 (2024)","DOI":"10.1109\/CVPR52733.2024.01247"},{"key":"1658_CR38","doi-asserted-by":"crossref","unstructured":"Zhu, J.-Y., Park, T., Isola, P., Efros, A.A.: Unpaired image-to-image translation using cycle-consistent adversarial networks. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2223\u20132232 (2017)","DOI":"10.1109\/ICCV.2017.244"},{"key":"1658_CR39","doi-asserted-by":"publisher","first-page":"172","DOI":"10.1109\/TIFS.2019.2916633","volume":"15","author":"C Peng","year":"2019","unstructured":"Peng, C., Wang, N., Li, J., Gao, X.: Face sketch synthesis in the wild via deep patch representation-based probabilistic graphical model. IEEE Trans. Inf. Forensics Secur. 15, 172\u2013183 (2019)","journal-title":"IEEE Trans. Inf. Forensics Secur."},{"issue":"9","key":"1658_CR40","doi-asserted-by":"publisher","first-page":"4350","DOI":"10.1109\/TCYB.2020.2972944","volume":"51","author":"J Yu","year":"2020","unstructured":"Yu, J., Xu, X., Gao, F., Shi, S., Wang, M., Tao, D., Huang, Q.: Toward realistic face photo-sketch synthesis via composition-aided gans. IEEE Trans. Cybern. 51(9), 4350\u20134362 (2020)","journal-title":"IEEE Trans. Cybern."},{"issue":"13","key":"1658_CR41","doi-asserted-by":"publisher","first-page":"15295","DOI":"10.1007\/s10489-022-03302-z","volume":"52","author":"Y Zhang","year":"2022","unstructured":"Zhang, Y., Yu, L., Sun, B., He, J.: Eng-face: cross-domain heterogeneous face synthesis with enhanced asymmetric cyclegan. Appl. Intell. 52(13), 15295\u201315307 (2022). https:\/\/doi.org\/10.1007\/s10489-022-03302-z","journal-title":"Appl. Intell."},{"key":"1658_CR42","doi-asserted-by":"crossref","unstructured":"Zhao, Y., Ding, H., Huang, H., Cheung, N.-M.: A closer look at few-shot image generation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 
9140\u20139150 (2022)","DOI":"10.1109\/CVPR52688.2022.00893"},{"key":"1658_CR43","unstructured":"Arjovsky, M., Chintala, S., Bottou, L.: Wasserstein generative adversarial networks. In: International Conference on Machine Learning, pp. 214\u2013223. PMLR (2017)"},{"key":"1658_CR44","unstructured":"Gulrajani, I., Ahmed, F., Arjovsky, M., Dumoulin, V., Courville, A.C.: Improved training of wasserstein gans. Adv. Neural Inf. Process. Syst. 30 (2017)"},{"key":"1658_CR45","unstructured":"Batzolis, G., Stanczuk, J., Sch\u00f6nlieb, C.-B., Etmann, C.: Conditional image generation with score-based diffusion models. arXiv preprint arXiv:2111.13606 (2021)"},{"key":"1658_CR46","first-page":"23593","volume":"35","author":"B Kawar","year":"2022","unstructured":"Kawar, B., Elad, M., Ermon, S., Song, J.: Denoising diffusion restoration models. Adv. Neural Inf. Process. Syst. 35, 23593\u201323606 (2022)","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"1658_CR47","unstructured":"Wolleb, J., Sandk\u00fchler, R., Bieder, F., Cattin, P.C.: The swiss army knife for image-to-image translation: multi-task diffusion models. arXiv preprint arXiv:2204.02641 (2022)"},{"key":"1658_CR48","unstructured":"Su, X., Song, J., Meng, C., Ermon, S.: Dual diffusion implicit bridges for image-to-image translation. arXiv preprint arXiv:2203.08382 (2022)"},{"key":"1658_CR49","unstructured":"Sasaki, H., Willcocks, C.G., Breckon, T.P.: Unit-ddpm: unpaired image translation with denoising diffusion probabilistic models. arXiv preprint arXiv:2104.05358 (2021)"},{"key":"1658_CR50","doi-asserted-by":"crossref","unstructured":"Preechakul, K., Chatthee, N., Wizadwongsa, S., Suwajanakorn, S.: Diffusion autoencoders: toward a meaningful and decodable representation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 
10619\u201310629 (2022)","DOI":"10.1109\/CVPR52688.2022.01036"},{"key":"1658_CR51","unstructured":"Dong, J., Liang, W., Li, H., Zhang, D., Cao, M., Ding, H., Khan, S., Khan, F.: How to continually adapt text-to-image diffusion models for flexible customization? In: The Thirty-eighth Annual Conference on Neural Information Processing Systems"},{"key":"1658_CR52","unstructured":"Shuai, X., Ding, H., Ma, X., Tu, R., Jiang, Y.-G., Tao, D.: A survey of multimodal-guided image editing with text-to-image diffusion models. arXiv preprint arXiv:2406.14555 (2024)"},{"key":"1658_CR53","doi-asserted-by":"crossref","unstructured":"Li, B., Xue, K., Liu, B., Lai, Y.-K.: Bbdm: Image-to-image translation with brownian bridge diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 1952\u20131961 (2023)","DOI":"10.1109\/CVPR52729.2023.00194"},{"key":"1658_CR54","unstructured":"Peng, Y., Zhao, C., Xie, H., Fukusato, T., Miyata, K.: Difffacesketch: High-fidelity face image synthesis with sketch-guided latent diffusion model. arXiv preprint arXiv:2302.06908 (2023)"},{"key":"1658_CR55","doi-asserted-by":"crossref","unstructured":"Peng, Y., Zhao, C., Xie, H., Fukusato, T., Miyata, K.: Sketch-guided latent diffusion model for high-fidelity face image synthesis. IEEE Access (2023)","DOI":"10.1109\/ACCESS.2023.3346408"},{"key":"1658_CR56","doi-asserted-by":"crossref","unstructured":"Liu, J., Huang, H., Cao, J., Duan, J., He, R.: Fine-grained face sketch-photo synthesis with text-guided diffusion models. In: Asian Conference on Pattern Recognition, pp. 340\u2013354. Springer (2023)","DOI":"10.1007\/978-3-031-47637-2_26"},{"key":"1658_CR57","doi-asserted-by":"crossref","unstructured":"Que, Y., Xiong, L., Wan, W., Xia, X., Liu, Z.: Denoising diffusion probabilistic model for face sketch-to-photo synthesis. IEEE Trans. Circuits Syst. Video Technol. 
(2024)","DOI":"10.1109\/TCSVT.2024.3409184"},{"key":"1658_CR58","unstructured":"Martinez, A.M.: The AR face database. CVC Tech. Rep. 24 (1998)"},{"key":"1658_CR59","unstructured":"Messer, K., Matas, J., Kittler, J., Luettin, J., Maitre, G., et\u00a0al.: Xm2vtsdb: the extended m2vts database. In: Second International Conference on Audio and Video-based Biometric Person Authentication, vol. 964, pp. 965\u2013966. Citeseer (1999)"},{"issue":"10","key":"1658_CR60","doi-asserted-by":"publisher","first-page":"1090","DOI":"10.1109\/34.879790","volume":"22","author":"PJ Phillips","year":"2000","unstructured":"Phillips, P.J., Moon, H., Rizvi, S.A., Rauss, P.J.: The feret evaluation methodology for face-recognition algorithms. IEEE Trans. Pattern Anal. Mach. Intell. 22(10), 1090\u20131104 (2000)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"4","key":"1658_CR61","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1109\/TIP.2003.819861","volume":"13","author":"Z Wang","year":"2004","unstructured":"Wang, Z., Bovik, A.C., Sheikh, H.R., Simoncelli, E.P.: Image quality assessment: from error visibility to structural similarity. IEEE Trans. Image Process. 13(4), 600\u2013612 (2004)","journal-title":"IEEE Trans. Image Process."},{"key":"1658_CR62","unstructured":"Wang, Z., Simoncelli, E.P., Bovik, A.C.: Multiscale structural similarity for image quality assessment. In: The Thrity-Seventh Asilomar Conference on Signals, Systems & Computers, 2003, vol. 2, pp. 1398\u20131402. IEEE (2003)"},{"issue":"13","key":"1658_CR63","doi-asserted-by":"publisher","first-page":"800","DOI":"10.1049\/el:20080522","volume":"44","author":"Q Huynh-Thu","year":"2008","unstructured":"Huynh-Thu, Q., Ghanbari, M.: Scope of validity of PSNR in image video quality assessment. Electron. Lett. 44(13), 800\u2013801 (2008)","journal-title":"Electron. 
Lett."},{"key":"1658_CR64","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"1658_CR65","doi-asserted-by":"crossref","unstructured":"Chen, S., Liu, Y., Gao, X., Han, Z.: Mobilefacenets: efficient CNNs for accurate real-time face verification on mobile devices. In: Biometric Recognition: 13th Chinese Conference, CCBR 2018, Urumqi, China, August 11\u201312, 2018, Proceedings 13, pp. 428\u2013438. Springer (2018)","DOI":"10.1007\/978-3-319-97909-0_46"},{"key":"1658_CR66","doi-asserted-by":"publisher","first-page":"3487","DOI":"10.1109\/TIP.2021.3061286","volume":"30","author":"F Gao","year":"2021","unstructured":"Gao, F., Xu, X., Yu, J., Shang, M., Li, X., Tao, D.: Complementary, heterogeneous and adversarial networks for image-to-image translation. IEEE Trans. Image Process. 30, 3487\u20133498 (2021)","journal-title":"IEEE Trans. Image Process."},{"key":"1658_CR67","unstructured":"Kingma, D., Ba, J.: Adam: A method for stochastic optimization. Comput. Sci. (2014)"},{"key":"1658_CR68","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Liu, W., Jia, Y., Sermanet, P., Reed, S., Anguelov, D., Erhan, D., Vanhoucke, V., Rabinovich, A.: Going deeper with convolutions. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1\u20139 (2015)","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"1658_CR69","doi-asserted-by":"crossref","unstructured":"Cao, Q., Shen, L., Xie, W., Parkhi, O.M., Zisserman, A.: Vggface2: a dataset for recognising faces across pose and age. IEEE Comput. Soc. 
(2017)","DOI":"10.1109\/FG.2018.00020"},{"issue":"11","key":"1658_CR70","doi-asserted-by":"publisher","first-page":"2884","DOI":"10.1109\/TIFS.2018.2833032","volume":"13","author":"X Wu","year":"2018","unstructured":"Wu, X., He, R., Sun, Z., Tan, T.: A light cnn for deep face representation with noisy labels. IEEE Trans. Inf. Forensics Secur. 13(11), 2884\u20132896 (2018)","journal-title":"IEEE Trans. Inf. Forensics Secur."},{"key":"1658_CR71","unstructured":"Yi, D., Lei, Z., Liao, S., Li, S.Z.: Learning face representation from scratch. Comput. Sci. (2014)"},{"key":"1658_CR72","volume-title":"Ms-celeb-1m: A Dataset and Benchmark for Large-scale Face Recognition","author":"Y Guo","year":"2016","unstructured":"Guo, Y., Zhang, L., Hu, Y., He, X., Gao, J.: Ms-celeb-1m: A Dataset and Benchmark for Large-scale Face Recognition. Springer, Cham (2016)"},{"key":"1658_CR73","unstructured":"Duta, I.C., Liu, L., Zhu, F., Shao, L.: Improved residual networks for image and video recognition. arXiv preprint arXiv:2004.04989 (2020)"},{"key":"1658_CR74","doi-asserted-by":"crossref","unstructured":"Esser, P., Rombach, R., Ommer, B.: Taming transformers for high-resolution image synthesis. In: Computer Vision and Pattern Recognition (2021)","DOI":"10.1109\/CVPR46437.2021.01268"},{"issue":"4","key":"1658_CR75","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1007\/s11633-022-1349-9","volume":"19","author":"D-P Fan","year":"2022","unstructured":"Fan, D.-P., Huang, Z., Zheng, P., Liu, H., Qin, X., Van Gool, L.: Facial-sketch synthesis: a new challenge. Mach. Intell. Res. 19(4), 257\u2013287 (2022)","journal-title":"Mach. Intell. Res."},{"key":"1658_CR76","doi-asserted-by":"publisher","unstructured":"Serengil, S.I., Ozpinar, A.: Lightface: a hybrid deep face recognition framework. In: 2020 Innovations in Intelligent Systems and Applications Conference (ASYU), pp. 23\u201327. IEEE (2020). 
https:\/\/doi.org\/10.1109\/ASYU50717.2020.9259802","DOI":"10.1109\/ASYU50717.2020.9259802"}],"container-title":["Machine Vision and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00138-024-01658-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00138-024-01658-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00138-024-01658-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,13]],"date-time":"2025-03-13T04:19:40Z","timestamp":1741839580000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00138-024-01658-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,1,11]]},"references-count":76,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2025,3]]}},"alternative-id":["1658"],"URL":"https:\/\/doi.org\/10.1007\/s00138-024-01658-5","relation":{},"ISSN":["0932-8092","1432-1769"],"issn-type":[{"value":"0932-8092","type":"print"},{"value":"1432-1769","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,1,11]]},"assertion":[{"value":"30 September 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 December 2024","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"31 December 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 January 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article 
History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no Conflict of interest to declare that are relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"34"}}