{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T16:42:42Z","timestamp":1777567362534,"version":"3.51.4"},"reference-count":50,"publisher":"Tsinghua University Press","issue":"4","license":[{"start":{"date-parts":[[2023,12,1]],"date-time":"2023-12-01T00:00:00Z","timestamp":1701388800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"},{"start":{"date-parts":[[2023,7,27]],"date-time":"2023-07-27T00:00:00Z","timestamp":1690416000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Comp. Visual. Med."],"published-print":{"date-parts":[[2023,12]]},"DOI":"10.1007\/s41095-022-0331-3","type":"journal-article","created":{"date-parts":[[2023,7,27]],"date-time":"2023-07-27T05:01:37Z","timestamp":1690434097000},"page":"827-841","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":12,"title":["Pyramid-VAE-GAN: Transferring hierarchical latent variables for image inpainting"],"prefix":"10.26599","volume":"9","author":[{"given":"Huiyuan","family":"Tian","sequence":"first","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University, Hangzhou 310027, China"}]},{"given":"Li","family":"Zhang","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University, Hangzhou 310027, China; Advanced Technology Research Institute, Zhejiang University, Hangzhou 310027, China"}]},{"given":"Shijian","family":"Li","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University, Hangzhou 310027, China"}]},{"given":"Min","family":"Yao","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University, Hangzhou 310027, China"}]},{"given":"Gang","family":"Pan","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University, Hangzhou 310027, China"}]}],"member":"11138","reference":[{"key":"331_CR1","doi-asserted-by":"crossref","unstructured":"Bertalmio, M.; Sapiro, G.; Caselles, V.; Ballester, C. Image inpainting. In: Proceedings of the 27th Annual Conference on Computer Graphics and Interactive Techniques, 417\u2013424, 2000.","DOI":"10.1145\/344779.344972"},{"key":"331_CR2","doi-asserted-by":"publisher","first-page":"1784","DOI":"10.1109\/TIP.2020.3048629","volume":"30","author":"N Wang","year":"2021","unstructured":"Wang, N.; Zhang, Y. P.; Zhang, L. F. Dynamic selection network for image inpainting. IEEE Transactions on Image Processing Vol. 30, 1784\u20131798, 2021.","journal-title":"IEEE Transactions on Image Processing"},{"key":"331_CR3","doi-asserted-by":"crossref","unstructured":"Li, J. Y.; Wang, N.; Zhang, L. F.; Du, B.; Tao, D. C. Recurrent feature reasoning for image inpainting. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 7757\u20137765, 2020.","DOI":"10.1109\/CVPR42600.2020.00778"},{"key":"331_CR4","doi-asserted-by":"crossref","unstructured":"Wan, Z. Y.; Zhang, J. B.; Chen, D. D.; Liao, J. High-fidelity pluralistic image completion with transformers. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 4672\u20134681, 2021.","DOI":"10.1109\/ICCV48922.2021.00465"},{"issue":"5","key":"331_CR5","doi-asserted-by":"publisher","first-page":"858","DOI":"10.3390\/electronics9050858","volume":"9","author":"M Lu","year":"2020","unstructured":"Lu, M.; Niu, S. Z. A detection approach using LSTM-CNN for object removal caused by exemplar-based image inpainting. Electronics Vol. 9, No. 5, 858, 2020.","journal-title":"Electronics"},{"key":"331_CR6","unstructured":"Shetty, R.; Fritz, M.; Schiele, B. Adversarial scene editing: Automatic object removal from weak supervision. In: Proceedings of the 32nd International Conference on Neural Information Processing Systems, 7717\u20137727, 2018."},{"key":"331_CR7","doi-asserted-by":"crossref","unstructured":"Barnes, C.; Shechtman, E.; Finkelstein, A.; Goldman, D. B. PatchMatch: A randomized correspondence algorithm for structural image editing. ACM Transactions on Graphics Vol. 28, No. 3, Article No. 24, 2009.","DOI":"10.1145\/1531326.1531330"},{"key":"331_CR8","doi-asserted-by":"crossref","unstructured":"Pathak, D.; Kr\u00e4henb\u00fchl, P.; Donahue, J.; Darrell, T.; Efros, A. A. Context encoders: Feature learning by inpainting. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2536\u20132544, 2016.","DOI":"10.1109\/CVPR.2016.278"},{"key":"331_CR9","doi-asserted-by":"crossref","unstructured":"Yu, J. H.; Lin, Z.; Yang, J. M.; Shen, X. H.; Lu, X.; Huang, T. S. Generative image inpainting with contextual attention. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 5505\u20135514, 2018.","DOI":"10.1109\/CVPR.2018.00577"},{"issue":"6","key":"331_CR10","doi-asserted-by":"publisher","first-page":"660","DOI":"10.23919\/TST.2017.8195348","volume":"22","author":"X Wu","year":"2017","unstructured":"Wu, X.; Xu, K.; Hall, P. A survey of image synthesis and editing with generative adversarial networks. Tsinghua Science and Technology Vol. 22, No. 6, 660\u2013674, 2017.","journal-title":"Tsinghua Science and Technology"},{"issue":"1","key":"331_CR11","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1007\/s41095-021-0234-8","volume":"8","author":"Y Xue","year":"2022","unstructured":"Xue, Y.; Guo, Y. C.; Zhang, H.; Xu, T.; Zhang, S. H.; Huang, X. L. Deep image synthesis from intuitive user input: A review and perspectives. Computational Visual Media Vol. 8, No. 1, 3\u201331, 2022.","journal-title":"Computational Visual Media"},{"issue":"2","key":"331_CR12","doi-asserted-by":"publisher","first-page":"239","DOI":"10.1007\/s41095-021-0238-4","volume":"8","author":"X X Zeng","year":"2022","unstructured":"Zeng, X. X.; Wu, Z. L.; Peng, X. J.; Qiao, Y. Joint 3D facial shape reconstruction and texture completion from a single image. Computational Visual Media Vol. 8, No. 2, 239\u2013256, 2022.","journal-title":"Computational Visual Media"},{"key":"331_CR13","doi-asserted-by":"publisher","first-page":"2344","DOI":"10.1109\/TIP.2019.2945866","volume":"29","author":"X Wu","year":"2020","unstructured":"Wu, X.; Li, R. L.; Zhang, F. L.; Liu, J. C.; Wang, J.; Shamir, A.; Hu, S. M. Deep portrait image completion and extrapolation. IEEE Transactions on Image Processing Vol. 29, 2344\u20132355, 2020.","journal-title":"IEEE Transactions on Image Processing"},{"key":"331_CR14","doi-asserted-by":"crossref","unstructured":"Liu, H. Y.; Wan, Z. Y.; Huang, W.; Song, Y. B.; Han, X. T.; Liao, J. PD-GAN: Probabilistic diverse GAN for image inpainting. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 9367\u20139376, 2021.","DOI":"10.1109\/CVPR46437.2021.00925"},{"issue":"6","key":"331_CR15","doi-asserted-by":"publisher","first-page":"3460","DOI":"10.1007\/s10489-020-01971-2","volume":"51","author":"Y T Chen","year":"2021","unstructured":"Chen, Y. T.; Zhang, H. P.; Liu, L. W.; Chen, X.; Zhang, Q.; Yang, K.; Xia, R. L.; Xie, J. B. Research on image inpainting algorithm of improved GAN based on two-discriminations networks. Applied Intelligence Vol. 51, No. 6, 3460\u20133474, 2021.","journal-title":"Applied Intelligence"},{"issue":"11","key":"331_CR16","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1145\/3422622","volume":"63","author":"I Goodfellow","year":"2020","unstructured":"Goodfellow, I.; Pouget-Abadie, J.; Mirza, M.; Xu, B.; Warde-Farley, D.; Ozair, S.; Courville, A.; Bengio, Y. Generative adversarial networks. Communications of the ACM Vol. 63, No. 11, 139\u2013144, 2020.","journal-title":"Communications of the ACM"},{"key":"331_CR17","doi-asserted-by":"crossref","unstructured":"Zeng, Y. H.; Fu, J. L.; Chao, H. Y.; Guo, B. N. Learning pyramid-context encoder network for high-quality image inpainting. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 1486\u20131494, 2019.","DOI":"10.1109\/CVPR.2019.00158"},{"key":"331_CR18","unstructured":"Kingma, D. P.; Welling, M. Auto-encoding variational bayes. In: Proceedings of the International Conference on Learning Representations, 2014."},{"key":"331_CR19","unstructured":"Karras, T.; Aila, T. M.; Laine, S.; Lehtinen, J. Progressive growing of GANs for improved quality, stability, and variation. In: Proceedings of the International Conference on Learning Representations, 2018."},{"key":"331_CR20","doi-asserted-by":"crossref","unstructured":"Krause, J.; Stark, M.; Jia, D.; Li, F. F. 3D object representations for fine-grained categorization. In: Proceedings of the IEEE International Conference on Computer Vision Workshops, 554\u2013561, 2013.","DOI":"10.1109\/ICCVW.2013.77"},{"key":"331_CR21","doi-asserted-by":"crossref","unstructured":"Cimpoi, M.; Maji, S.; Kokkinos, I.; Mohamed, S.; Vedaldi, A. Describing textures in the wild. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 3606\u20133613, 2014.","DOI":"10.1109\/CVPR.2014.461"},{"key":"331_CR22","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"364","DOI":"10.1007\/978-3-642-40602-7_39","volume-title":"Pattern Recognition. GCPR 2013","author":"R Tyle\u010dek","year":"2013","unstructured":"Tyle\u010dek, R.; \u0160\u00e1ra, R. Spatial pattern templates for recognition of objects with regular structure. In: Pattern Recognition. GCPR 2013. Lecture Notes in Computer Science, Vol. 8142. Weickert, J.; Hein, M.; Schiele, B. Eds. Springer Berlin Heidelberg, 364\u2013374, 2013."},{"issue":"1","key":"331_CR23","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1007\/s41095-016-0064-2","volume":"3","author":"C Barnes","year":"2017","unstructured":"Barnes, C.; Zhang, F. L. A survey of the state-of-the-art in patch-based synthesis. Computational Visual Media Vol. 3, No. 1, 3\u201320, 2017.","journal-title":"Computational Visual Media"},{"key":"331_CR24","series-title":"Lecture Notes in Biomathematics","doi-asserted-by":"publisher","first-page":"267","DOI":"10.1007\/978-3-642-46466-9_18","volume-title":"Competition and Cooperation in Neural Nets","author":"K Fukushima","year":"1982","unstructured":"Fukushima, K.; Miyake, S. Neocognitron: A self-organizing neural network model for a mechanism of visual pattern recognition. In: Competition and Cooperation in Neural Nets. Lecture Notes in Biomathematics, Vol. 45. Amari, S.; Arbib, M. A. Eds. Springer Berlin Heidelberg, 267\u2013285, 1982."},{"issue":"4","key":"331_CR25","doi-asserted-by":"publisher","first-page":"541","DOI":"10.1162\/neco.1989.1.4.541","volume":"1","author":"Y LeCun","year":"1989","unstructured":"LeCun, Y.; Boser, B.; Denker, J. S.; Henderson, D.; Howard, R. E.; Hubbard, W.; Jackel, L. D. Backpropagation applied to handwritten zip code recognition. Neural Computation Vol. 1, No. 4, 541\u2013551, 1989.","journal-title":"Neural Computation"},{"key":"331_CR26","doi-asserted-by":"crossref","unstructured":"Peng, J. L.; Liu, D.; Xu, S. C.; Li, H. Q. Generating diverse structure for image inpainting with hierarchical VQ-VAE. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 10770\u201310779, 2021.","DOI":"10.1109\/CVPR46437.2021.01063"},{"key":"331_CR27","unstructured":"Vahdat, A; Kautz, J. NVAE: A deep hierarchical variational autoencoder. In: Proceedings of the 34th International Conference on Neural Information Processing Systems, Article No. 1650, 19667\u201319679, 2020."},{"key":"331_CR28","unstructured":"Ramesh, A.; Pavlov, M.; Goh, G.; Gray, S.; Voss, C.; Radford, A.; Chen, M.; Sutskever, I. Zero-shot text-to-image generation. In: Proceedings of the 38th International Conference on Machine Learning, Vol. 139, 8821\u20138831, 2021."},{"key":"331_CR29","unstructured":"Bowman, S. R.; Vilnis, L.; Vinyals, O.; Dai, A. M.; Jozefowicz, R.; Bengio, S. Generating sentences from a continuous space. arXiv preprint arXiv:1511.06349.2015."},{"issue":"7883","key":"331_CR30","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1038\/s41586-021-04043-8","volume":"599","author":"J Frazer","year":"2021","unstructured":"Frazer, J.; Notin, P.; Dias, M.; Gomez, A.; Min, J. K.; Brock, K.; Gal, Y.; Marks, D. S. Disease variant prediction with deep generative models of evolutionary data. Nature Vol. 599, No. 7883, 91\u201395, 2021.","journal-title":"Nature"},{"key":"331_CR31","unstructured":"Salimans, T.; Kingma, D. P.; Welling, M. Markov Chain Monte Carlo and variational inference: Bridging the gap. In: Proceedings of the 32nd International Conference on International Conference on Machine Learning, Vol. 37, 1218\u20131226, 2015."},{"key":"331_CR32","unstructured":"Rezende, D. J.; Mohamed, S.; Wierstra, D. Stochastic backpropagation and approximate inference in deep generative models. In: Proceedings of the 31st International Conference on International Conference on Machine Learning, Vol. 32, II-1278\u2013II-1286, 2014."},{"key":"331_CR33","unstructured":"Kulkarni, T. D.; Whitney, W. F.; Kohli, P.; Tenenbaum, J. B. Deep convolutional inverse graphics network. In: Proceedings of the 28th International Conference on Neural Information Processing Systems, 2539\u20132547, 2015."},{"issue":"3","key":"331_CR34","doi-asserted-by":"publisher","first-page":"363","DOI":"10.1007\/s41095-021-0219-7","volume":"7","author":"R Q Sun","year":"2021","unstructured":"Sun, R. Q.; Huang, C.; Zhu, H. L.; Ma, L. Z. Maskaware photorealistic facial attribute manipulation. Computational Visual Media Vol. 7, No. 3, 363\u2013374, 2021.","journal-title":"Computational Visual Media"},{"key":"331_CR35","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"835","DOI":"10.1007\/978-3-319-46478-7_51","volume-title":"Computer Vision\u2013ECCV 2016","author":"J Walker","year":"2016","unstructured":"Walker, J.; Doersch, C.; Gupta, A.; Hebert, M. An uncertain future: Forecasting from static images using variational autoencoders. In: Computer Vision\u2013ECCV 2016. Lecture Notes in Computer Science, Vol. 9911. Leibe, B.; Matas, J.; Sebe, N.; Welling, M. Eds. Springer Cham, 835\u2013851, 2016."},{"key":"331_CR36","unstructured":"Sohn, K.; Yan, X. C.; Lee, H. Learning structured output representation using deep conditional generative models. In: Proceedings of the 28th International Conference on Neural Information Processing Systems, Vol. 2, 3483\u20133491, 2015."},{"key":"331_CR37","doi-asserted-by":"publisher","first-page":"3665","DOI":"10.1109\/TIP.2020.2964429","volume":"29","author":"R Gao","year":"2020","unstructured":"Gao, R.; Hou, X. S.; Qin, J.; Chen, J. X.; Liu, L.; Zhu, F.; Zhang, Z.; Shao, L. Zero-VAE-GAN: Generating unseen features for generalized and transductive zero-shot learning. IEEE Transactions on Image Processing Vol. 29, 3665\u20133680, 2020.","journal-title":"IEEE Transactions on Image Processing"},{"key":"331_CR38","doi-asserted-by":"crossref","unstructured":"Zheng, C. X.; Cham, T. J.; Cai, J. F. Pluralistic image completion. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 1438\u20131447, 2019.","DOI":"10.1109\/CVPR.2019.00153"},{"key":"331_CR39","unstructured":"Gonzalez, R. C.; Woods, R. E. Digital Image Processing, 4th edn. Pearson, 2018."},{"key":"331_CR40","unstructured":"Lim, J. H.; Ye, J. C. Geometric GAN. arXiv preprint arXiv:1705.02894, 2017."},{"key":"331_CR41","series-title":"International Series in Operations Research & Management Science","doi-asserted-by":"publisher","first-page":"105","DOI":"10.1007\/978-1-4939-1384-8_5","volume-title":"Handbook of Simulation Optimization","author":"M C Fu","year":"2015","unstructured":"Fu, M. C. Stochastic gradient estimation. In: Handbook of Simulation Optimization. International Series in Operations Research & Management Science, Vol. 216. Fu, M. Ed. Springer New York, 105\u2013147, 2015."},{"key":"331_CR42","doi-asserted-by":"crossref","unstructured":"Devroye, L. Sample-based non-uniform random variate generation. In: Proceedings of the 18th Conference on Winter Simulation, 260\u2013265, 1986.","DOI":"10.1145\/318242.318443"},{"key":"331_CR43","unstructured":"Doersch, C. Tutorial on variational autoencoders. arXiv preprint arXiv:1606.05908, 2016."},{"key":"331_CR44","doi-asserted-by":"crossref","unstructured":"Iizuka, S.; Simo-Serra, E.; Ishikawa, H. Globally and locally consistent image completion. ACM Transactions on Graphics Vol. 36, No. 4, Article No. 107, 2017.","DOI":"10.1145\/3072959.3073659"},{"key":"331_CR45","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"89","DOI":"10.1007\/978-3-030-01252-6_6","volume-title":"Computer Vision\u2013ECCV 2018","author":"G L Liu","year":"2018","unstructured":"Liu, G. L.; Reda, F. A.; Shih, K. J.; Wang, T. C.; Tao, A.; Catanzaro, B. Image inpainting for irregular holes using partial convolutions. In: Computer Vision\u2013ECCV 2018. Lecture Notes in Computer Science, Vol. 11215. Ferrari, V.; Hebert, M.; Sminchisescu, C.; Weiss, Y. Eds. Springer Cham, 89\u2013105, 2018."},{"key":"331_CR46","doi-asserted-by":"crossref","unstructured":"Yu, J. H.; Lin, Z.; Yang, J. M.; Shen, X. H.; Lu, X.; Huang, T. Free-form image inpainting with gated convolution. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 4470\u20134479, 2019.","DOI":"10.1109\/ICCV.2019.00457"},{"issue":"3","key":"331_CR47","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1007\/BF00994018","volume":"20","author":"C Cortes","year":"1995","unstructured":"Cortes, C.; Vapnik, V. Support-vector networks. Machine Learning Vol. 20, No. 3, 273\u2013297, 1995.","journal-title":"Machine Learning"},{"key":"331_CR48","unstructured":"Wang, Z.; Simoncelli, E. P.; Bovik, A. C. Multiscale structural similarity for image quality assessment. In: Proceedings of the 37th Asilomar Conference on Signals, Systems & Computers, 1398\u20131402, 2003."},{"key":"331_CR49","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-84882-935-0","volume-title":"Computer Vision: Algorithms and Applications","author":"R Szeliski","year":"2011","unstructured":"Szeliski, R. Computer Vision: Algorithms and Applications. Springer London, 2011."},{"key":"331_CR50","unstructured":"Heusel, M.; Ramsauer, H.; Unterthiner, T.; Nessler, B.; Hochreiter, S. GANs trained by a two time-scale update rule converge to a local Nash equilibrium. In: Proceedings of the 31st International Conference on Neural Information Processing Systems, 6629\u20136640, 2017."}],"container-title":["Computational Visual Media"],"original-title":[],"link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41095-022-0331-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s41095-022-0331-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41095-022-0331-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"},{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10750449\/10897724\/10897735.pdf?arnumber=10897735","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,25]],"date-time":"2025-06-25T18:22:01Z","timestamp":1750875721000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10897735\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,12]]},"references-count":50,"journal-issue":{"issue":"4"},"URL":"https:\/\/doi.org\/10.1007\/s41095-022-0331-3","relation":{},"ISSN":["2096-0662","2096-0433"],"issn-type":[{"value":"2096-0662","type":"electronic"},{"value":"2096-0433","type":"print"}],"subject":[],"published":{"date-parts":[[2023,12]]},"assertion":[{"value":"2 May 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 December 2022","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 July 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declaration of competing interest"}}]}}