{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,16]],"date-time":"2026-05-16T16:13:20Z","timestamp":1778948000256,"version":"3.51.4"},"reference-count":274,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2024,1,19]],"date-time":"2024-01-19T00:00:00Z","timestamp":1705622400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,19]],"date-time":"2024-01-19T00:00:00Z","timestamp":1705622400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2024,7]]},"DOI":"10.1007\/s11263-023-01977-6","type":"journal-article","created":{"date-parts":[[2024,1,19]],"date-time":"2024-01-19T13:02:19Z","timestamp":1705669339000},"page":"2367-2400","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":67,"title":["Deep Learning-Based Image and Video Inpainting: A Survey"],"prefix":"10.1007","volume":"132","author":[{"given":"Weize","family":"Quan","sequence":"first","affiliation":[]},{"given":"Jiaxi","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Yanli","family":"Liu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2209-2404","authenticated-orcid":false,"given":"Dong-Ming","family":"Yan","sequence":"additional","affiliation":[]},{"given":"Peter","family":"Wonka","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,1,19]]},"reference":[{"key":"1977_CR1","first-page":"214","volume":"70","author":"M Arjovsky","year":"2017","unstructured":"Arjovsky, M., Chintala, S., & Bottou, L. (2017). 
Wasserstein Generative Adversarial Networks. Int. Conf. Mach. Learn.,70, 214\u2013223.","journal-title":"International Conference on Machine Learning"},{"key":"1977_CR2","first-page":"17981","volume":"34","author":"J Austin","year":"2021","unstructured":"Austin, J., Johnson, D. D., Ho, J., Tarlow, D., & van den Berg, R. (2021). Structured Denoising Diffusion Models in Discrete State-Spaces. Adv. Neural Inform. Process. Syst.,34, 17981\u201317993.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"1977_CR3","doi-asserted-by":"crossref","unstructured":"Avrahami, O., Lischinski, D., & Fried, O. (2022). Blended Diffusion for Text-Driven Editing of Natural Images. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 18208-18218).","DOI":"10.1109\/CVPR52688.2022.01767"},{"issue":"8","key":"1977_CR4","doi-asserted-by":"publisher","first-page":"1200","DOI":"10.1109\/83.935036","volume":"10","author":"C Ballester","year":"2001","unstructured":"Ballester, C., Bertalmio, M., Caselles, V., Sapiro, G., & Verdera, J. (2001). Filling-in by joint interpolation of vector fields and gray levels. IEEE Trans Image Process, 10(8), 1200\u20131211.","journal-title":"IEEE Transactions on Image Processing"},{"key":"1977_CR5","doi-asserted-by":"crossref","unstructured":"Baluja, S., Marwood, D., Johnston, N., Covell, M. (2019). Learning to render better image previews. In I2019 IEEE International Conference on Image Processing (ICIP), (pp. 1700-1704). IEEE.","DOI":"10.1109\/ICIP.2019.8803147"},{"issue":"3","key":"1977_CR6","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1145\/1531326.1531330","volume":"28","author":"C Barnes","year":"2009","unstructured":"Barnes, C., Shechtman, E., Finkelstein, A., & Goldman, D. B. (2009). PatchMatch: A randomized correspondence algorithm for structural image editing. 
ACM Trans Graph, 28(3), 24.","journal-title":"ACM Trans Graph"},{"key":"1977_CR7","doi-asserted-by":"crossref","unstructured":"Bertalmio, M., Sapiro, G., Caselles, V., & Ballester, C. (2000). Image inpainting. In Proceedings ACM SIGGRAPH, pp. 417\u2013424","DOI":"10.1145\/344779.344972"},{"key":"1977_CR8","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1007\/s41095-021-0242-8","volume":"8","author":"X Bian","year":"2022","unstructured":"Bian, X., Wang, C., Quan, W., Ye, J., Zhang, X., & Yan, D. M. (2022). Scene text removal via cascaded text stroke detection and erasing. Computational Visual Media, 8, 273\u2013287.","journal-title":"Computational Visual Media"},{"key":"1977_CR9","doi-asserted-by":"crossref","unstructured":"Blau, Y., & Michaeli, T. (2018). The perception-distortion tradeoff. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 6228-6237).","DOI":"10.1109\/CVPR.2018.00652"},{"key":"1977_CR10","doi-asserted-by":"publisher","first-page":"679","DOI":"10.1109\/TPAMI.1986.4767851","volume":"6","author":"J Canny","year":"1986","unstructured":"Canny, J. (1986). A computational approach to edge detection. IEEE Trans Pattern Anal Mach Intell, 6, 679\u2013698.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1977_CR11","doi-asserted-by":"crossref","unstructured":"Cao, C., & Fu, Y. (2021). Learning a sketch tensor space for image inpainting of man-made scenes. In Proceedings of the IEEE\/CVF international conference on computer vision, (pp. 14509\u201314518)","DOI":"10.1109\/ICCV48922.2021.01424"},{"key":"1977_CR12","doi-asserted-by":"crossref","unstructured":"Cao, C., Dong, Q., Fu, Y. (2022). Learning prior feature and attention enhanced image inpainting. 
In European conference on computer vision","DOI":"10.1007\/978-3-031-19784-0_18"},{"issue":"1","key":"1977_CR13","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1016\/0165-1684(88)90028-X","volume":"15","author":"S Carlsson","year":"1988","unstructured":"Carlsson, S. (1988). Sketch based coding of grey level images. Sign Process, 15(1), 57\u201383.","journal-title":"Sign Process"},{"key":"1977_CR14","doi-asserted-by":"crossref","unstructured":"Carreira, J., Zisserman, A. (2017). Quo vadis, action recognition? A new model and the kinetics dataset. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 4724\u20134733)","DOI":"10.1109\/CVPR.2017.502"},{"key":"1977_CR15","doi-asserted-by":"crossref","unstructured":"Chang, Y. L, Liu, Z. Y., Lee, K. Y., & Hsu, W. (2019a). Free-form video inpainting with 3d gated convolution and temporal patchgan. In International conference on computer vision, (pp. 9066\u20139075)","DOI":"10.1109\/ICCV.2019.00916"},{"key":"1977_CR16","unstructured":"Chang, Y. L., Liu, Z. Y., Lee, K. Y., & Hsu, W. (2019b). Learnable gated temporal shift module for deep video inpainting. In The British Machine vision conference"},{"key":"1977_CR17","doi-asserted-by":"crossref","unstructured":"Chang, Y. L., Yu Liu, Z., & Hsu, W. (2019). Vornet: Spatio-temporally consistent video inpainting for object removal. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition workshops","DOI":"10.1109\/CVPRW.2019.00229"},{"key":"1977_CR18","doi-asserted-by":"crossref","unstructured":"Chen, C., Cai, J., Hu, Y., Tang, X., Wang, X., Yuan, C., & Bai, S. (2021). Deep interactive video inpainting: An invisibility cloak for harry potter. In Proceedings of the 29th ACM international conference on multimedia (pp. 862-870).","DOI":"10.1145\/3474085.3475262"},{"key":"1977_CR19","doi-asserted-by":"crossref","unstructured":"Chen, L., Zhang, H., Xiao, J., Nie, L., Shao, J., Liu, W., & Chua, T. S. (2017). 
Sca-cnn: Spatial and channel-wise attention in convolutional networks for image captioning. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 5659-5667).","DOI":"10.1109\/CVPR.2017.667"},{"key":"1977_CR20","unstructured":"Chen, P. (2018). Video retouch: Object removal. http:\/\/www.12371.cn\/2021\/02\/08\/ARTI1612745858192472.shtml"},{"key":"1977_CR21","unstructured":"Chen, T., Lucic, M., Houlsby, N., & Gelly, S. (2018). On self modulation for generative adversarial networks. In International conference on learning representations"},{"key":"1977_CR22","first-page":"4479","volume":"33","author":"L Chi","year":"2020","unstructured":"Chi, L., Jiang, B., & Mu, Y. (2020). Fast Fourier Convolution. Adv. Neural Inform. Process. Syst., 33, 4479\u20134488.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"1977_CR23","unstructured":"Chu, P., Quan, W., Wang, T., Wang, P., Ren, P., & Yan23, D. M. (2021). Deep Video Decaptioning. In Proceedings of the British machine vision conference"},{"key":"1977_CR24","doi-asserted-by":"crossref","unstructured":"Chung, H., Sim, B., & Ye, J. C. (2022). Come-closer-diffuse-faster: Accelerating conditional diffusion models for inverse problems through stochastic contraction. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 12413-12422).","DOI":"10.1109\/CVPR52688.2022.01209"},{"key":"1977_CR25","doi-asserted-by":"crossref","unstructured":"Cimpoi, M., Maji, S., Kokkinos, I., Mohamed, S., & Vedaldi, A. (2014). Describing textures in the wild. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 3606-3613).","DOI":"10.1109\/CVPR.2014.461"},{"issue":"9","key":"1977_CR26","doi-asserted-by":"publisher","first-page":"1200","DOI":"10.1109\/TIP.2004.833105","volume":"13","author":"A Criminisi","year":"2004","unstructured":"Criminisi, A., Perez, P., & Toyama, K. (2004). 
Region filling and object removal by exemplar-based image inpainting. IEEE Trans Image Process, 13(9), 1200\u20131212.","journal-title":"IEEE Transactions on Image Processing"},{"issue":"9","key":"1977_CR27","doi-asserted-by":"publisher","first-page":"10850","DOI":"10.1109\/TPAMI.2023.3261988","volume":"45","author":"FA Croitoru","year":"2023","unstructured":"Croitoru, F. A., Hondru, V., Ionescu, R. T., & Shah, M. (2023). Diffusion models in vision: A survey. IEEE Trans Pattern Anal Mach Intell, 45(9), 10850\u201310869.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"10","key":"1977_CR28","doi-asserted-by":"publisher","first-page":"2564","DOI":"10.1109\/TMM.2019.2958760","volume":"22","author":"Q Dai","year":"2020","unstructured":"Dai, Q., Chopp, H., Pouyet, E., Cossairt, O., Walton, M., & Katsaggelos, A. K. (2020). Adaptive image sampling using deep learning and its application on x-ray fluorescence image reconstruction. IEEE Trans Multimedia, 22(10), 2564\u20132578.","journal-title":"IEEE Transactions on Multimedia"},{"issue":"4","key":"1977_CR29","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2185520.2185578","volume":"31","author":"S Darabi","year":"2012","unstructured":"Darabi, S., Shechtman, E., Barnes, C., Goldman, D. B., & Sen, P. (2012). Image Melding: combining inconsistent images using patch-based synthesis. ACM Trans Graph (Proc SIGGRAPH), 31(4), 1\u201310.","journal-title":"ACM Trans Graph (Proc SIGGRAPH)"},{"issue":"5","key":"1977_CR30","doi-asserted-by":"publisher","first-page":"961","DOI":"10.1109\/18.57199","volume":"36","author":"I Daubechies","year":"1990","unstructured":"Daubechies, I. (1990). The wavelet transform, time-frequency localization and signal analysis. IEEE Trans Inf Theory, 36(5), 961\u20131005.","journal-title":"IEEE Transactions on Information Theory"},{"key":"1977_CR31","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L. 
J., Li, K., & Fei-Fei, L. (2009). Imagenet: A large-scale hierarchical image database. In 2009 IEEE conference on computer vision and pattern recognition (pp. 248-255). IEEE.","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"1977_CR32","doi-asserted-by":"crossref","unstructured":"Deng, Y., Tang, F., Dong, W., Sun, W., Huang, F., & Xu, C. (2020). Arbitrary style transfer via multi-adaptation network. In Proceedings of the 28th ACM international conference on multimedia (pp. 2719-2727).","DOI":"10.1145\/3394171.3414015"},{"key":"1977_CR33","doi-asserted-by":"crossref","unstructured":"Deng, Y., Hui, S., Zhou, S., Meng, D., & Wang, J. (2021). Learning contextual transformer network for image inpainting. In Proceedings of the 29th ACM international conference on multimedia (pp. 2529-2538).","DOI":"10.1145\/3474085.3475426"},{"key":"1977_CR34","doi-asserted-by":"crossref","unstructured":"Deng, Y., Hui, S., Meng, R., Zhou, S., & Wang, J. (2022). Hourglass attention network for image inpainting. In European conference on computer vision (pp. 483-501). Springer Nature Switzerland.","DOI":"10.1007\/978-3-031-19797-0_28"},{"key":"1977_CR35","unstructured":"Dinh, L., Krueger, D., & Bengio, Y. (2014). Nice: Non-linear independent components estimation. In Int Conf Learn Represent Worksh"},{"issue":"4","key":"1977_CR36","doi-asserted-by":"publisher","first-page":"101","DOI":"10.1145\/2185520.2185597","volume":"31","author":"C Doersch","year":"2012","unstructured":"Doersch, C., Singh, S., Gupta, A., Sivic, J., & Efros, A. A. (2012). What makes paris look like paris? ACM Transactions on Graphics, 31(4), 101.","journal-title":"ACM Transactions on Graphics"},{"key":"1977_CR37","doi-asserted-by":"crossref","unstructured":"Dolhansky, B., & Ferrer, C. C. (2018). Eye in-painting with exemplar generative adversarial networks. In Proceedings of the IEEE conference on computer vision and pattern recognition\" (pp. 
7902-7911).","DOI":"10.1109\/CVPR.2018.00824"},{"key":"1977_CR38","doi-asserted-by":"crossref","unstructured":"Dong, Q., Cao, C., & Fu, Y. (2022). Incremental transformer structure enhanced image inpainting with masking positional encoding. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 11358-11368).","DOI":"10.1109\/CVPR52688.2022.01107"},{"key":"1977_CR39","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., Weissenborn, D., Zhai, X., Unterthiner, T., & Houlsby, N. (2020). An image is worth 16x16 words: Transformers for image recognition at scale. In International conference on learning representations"},{"key":"1977_CR40","doi-asserted-by":"publisher","first-page":"81","DOI":"10.1007\/s11760-009-0144-1","volume":"5","author":"R Dosselmann","year":"2011","unstructured":"Dosselmann, R., & Yang, X. D. (2011). A comprehensive assessment of the structural similarity index. Sign Image and Video Process, 5, 81\u201391.","journal-title":"Sign Image and Video Process"},{"key":"1977_CR41","first-page":"1033","volume":"2","author":"A Efros","year":"1999","unstructured":"Efros, A., & Leung, T. (1999). Texture synthesis by non-parametric sampling. Int. Conf. Comput. Vis., 2, 1033\u20131038.","journal-title":"International Conference on Computer Vision"},{"issue":"2","key":"1977_CR42","doi-asserted-by":"publisher","first-page":"2007","DOI":"10.1007\/s11063-019-10163-0","volume":"51","author":"O Elharrouss","year":"2020","unstructured":"Elharrouss, O., Almaadeed, N., Al-Maadeed, S., & Akbari, Y. (2020). Image Inpainting: A Review. Neural Process Letters, 51(2), 2007\u20132028.","journal-title":"Neural Process Letters"},{"key":"1977_CR43","first-page":"3518","volume":"34","author":"P Esser","year":"2021","unstructured":"Esser, P., Rombach, R., Blattmann, A., & Ommer, B. (2021). ImageBART: Bidirectional Context with Multinomial Diffusion for Autoregressive Image Synthesis. Adv. Neural Inform. Process. 
Syst., 34, 3518\u20133532.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"1977_CR44","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s11263-014-0733-5","volume":"111","author":"M Everingham","year":"2015","unstructured":"Everingham, M., Eslami, S. M. A., Gool, L. V., Williams, C. K. I., Winn, J., & Zisserman, A. (2015). The pascal visual object classes challenge: A retrospective. Int J Comput Vis, 111, 98\u2013136.","journal-title":"International Journal of Computer Vision"},{"key":"1977_CR45","doi-asserted-by":"publisher","first-page":"167","DOI":"10.1023\/B:VISI.0000022288.19776.77","volume":"59","author":"PF Felzenszwalb","year":"2004","unstructured":"Felzenszwalb, P. F., & Huttenlocher, D. P. (2004). Efficient graph-based image segmentation. Int J Comput Vis, 59, 167\u2013181.","journal-title":"International Journal of Computer Vision"},{"issue":"11","key":"1977_CR46","doi-asserted-by":"publisher","first-page":"7432","DOI":"10.1109\/TCSVT.2022.3188169","volume":"32","author":"X Feng","year":"2022","unstructured":"Feng, X., Pei, W., Li, F., Chen, F., Zhang, D., & Lu, G. (2022). Generative memory-guided semantic reasoning model for image inpainting. IEEE Trans Circuit Syst Video Technol, 32(11), 7432\u20137447.","journal-title":"IEEE Transactions on Circuits and Systems for Video Technology"},{"key":"1977_CR47","doi-asserted-by":"crossref","unstructured":"Fu, J., Liu, J., Tian, H., Li, Y., Bao, Y., Fang, Z., & Lu, H. (2019). Dual attention network for scene segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 3146-3154).","DOI":"10.1109\/CVPR.2019.00326"},{"key":"1977_CR48","doi-asserted-by":"publisher","first-page":"255","DOI":"10.1007\/s10851-008-0087-0","volume":"31","author":"I Gali\u0107","year":"2008","unstructured":"Gali\u0107, I., Weickert, J., Welk, M., Bruhn, A., Belyaev, A., & Seidel, H. P. (2008). Image compression with anisotropic diffusion. 
J Math Imaging Vis, 31, 255\u2013269.","journal-title":"Journal of Mathematical Imaging and Vision"},{"key":"1977_CR49","doi-asserted-by":"crossref","unstructured":"Gao, C., Saraf, A., Huang, J. B., & Kopf, J. (2020). Flow-edge guided video completion. In Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XII 16 (pp. 713-729).","DOI":"10.1007\/978-3-030-58610-2_42"},{"key":"1977_CR50","doi-asserted-by":"crossref","unstructured":"Gatys, L. A., Ecker, A. S., & Bethge, M. (2016). Image style transfer using convolutional neural networks. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 2414-2423).","DOI":"10.1109\/CVPR.2016.265"},{"key":"1977_CR51","unstructured":"Goodfellow, I., Pouget-Abadie, J., Mirza, M., Xu, B., Warde-Farley, D., Ozair, S., & Bengio, Y. (2014). Generative adversarial nets. Advances in Neural Information Processing Systems, 27"},{"key":"1977_CR52","doi-asserted-by":"crossref","unstructured":"Granados, M., Kim, K. I., Tompkin, J., Kautz, J., & Theobalt, C. (2012). Background inpainting for videos with dynamic objects and a free-moving camera. In Computer Vision-ECCV 2012: 12th European Conference on Computer Vision, Florence, Italy, October 7-13, 2012, Proceedings, Part I 12 (pp. 682-695).","DOI":"10.1007\/978-3-642-33718-5_49"},{"key":"1977_CR53","doi-asserted-by":"crossref","unstructured":"Gu, J., Shen, Y., & Zhou, B. (2020). Image processing using multi-code gan prior. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 3012-3021).","DOI":"10.1109\/CVPR42600.2020.00308"},{"issue":"1","key":"1977_CR54","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1109\/MSP.2013.2273004","volume":"31","author":"C Guillemot","year":"2014","unstructured":"Guillemot, C., & Meur, O. L. (2014). Image inpainting: Overview and recent advances. 
IEEE Sign Process Magazine, 31(1), 127\u2013144.","journal-title":"IEEE Sign Process Magazine"},{"issue":"6","key":"1977_CR55","doi-asserted-by":"publisher","first-page":"2023","DOI":"10.1109\/TVCG.2017.2702738","volume":"24","author":"Q Guo","year":"2018","unstructured":"Guo, Q., Gao, S., Zhang, X., Yin, Y., & Zhang, C. (2018). Patch-based image inpainting via two-stage low rank approximation. IEEE Trans Vis Comput Graph, 24(6), 2023\u20132036.","journal-title":"IEEE Transactions on Visualization and Computer Graphics"},{"key":"1977_CR56","doi-asserted-by":"crossref","unstructured":"Guo, X., Yang, H., & Huang, D. (2021). Image inpainting via conditional texture and structure dual generation. In Proceedings of the IEEE\/CVF International Conference on Computer Vision (pp. 14134-14143).","DOI":"10.1109\/ICCV48922.2021.01387"},{"key":"1977_CR57","doi-asserted-by":"crossref","unstructured":"Guo, Z., Chen, Z., Yu, T., Chen, J., & Liu, S. (2019). Progressive image inpainting with full-resolution residual network. In Proceedings of the 27th ACM international conference on multimedia (pp. 2496-2504).","DOI":"10.1145\/3343031.3351022"},{"key":"1977_CR58","doi-asserted-by":"publisher","first-page":"190","DOI":"10.1109\/LSP.2020.3048608","volume":"28","author":"C Han","year":"2021","unstructured":"Han, C., & Wang, J. (2021). Face image inpainting with evolutionary generators. IEEE Sign Process Letters, 28, 190\u2013193.","journal-title":"IEEE Sign Process Letters"},{"key":"1977_CR59","doi-asserted-by":"crossref","unstructured":"Han, X., Wu, Z., Huang, W., Scott, M. R., & Davis, L. S. (2019). Finet: Compatible and diverse fashion image inpainting. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 4481-4491).","DOI":"10.1109\/ICCV.2019.00458"},{"key":"1977_CR60","doi-asserted-by":"crossref","unstructured":"He, K., & Sun, J. (2012). Statistics of patch offsets for image completion. 
In Computer Vision-ECCV 2012: 12th European conference on computer vision, Florence, Italy, October 7-13, 2012, Proceedings, Part II 12 (pp. 16-29).","DOI":"10.1007\/978-3-642-33709-3_2"},{"key":"1977_CR61","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2016). Deep residual learning for image recognition. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 770-778).","DOI":"10.1109\/CVPR.2016.90"},{"key":"1977_CR62","doi-asserted-by":"crossref","unstructured":"He, K., Chen, X., Xie, S., Li, Y., Doll\u00e1r, P., & Girshick, R. (2022). Masked autoencoders are scalable vision learners. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 16000-16009).","DOI":"10.1109\/CVPR52688.2022.01553"},{"issue":"6","key":"1977_CR63","doi-asserted-by":"publisher","first-page":"866","DOI":"10.1109\/TVCG.2014.2298016","volume":"20","author":"J Herling","year":"2014","unstructured":"Herling, J., & Broll, W. (2014). High-quality real-time video inpainting with pixmix. IEEE Trans Vis Comput Graph, 20(6), 866\u2013879.","journal-title":"IEEE Transactions on Visualization and Computer Graphics"},{"key":"1977_CR64","unstructured":"Hertz, A., Mokady, R., Tenenbaum, J., Aberman, K., Pritch, Y,. & Cohen-Or, D. (2022). Prompt-to-prompt image editing with cross attention control. arXiv preprint arXiv:2208.01626"},{"key":"1977_CR65","first-page":"6626","volume":"30","author":"M Heusel","year":"2017","unstructured":"Heusel M, Ramsauer H, Unterthiner T, Nessler B, Hochreiter S (2017) Gans trained by a two time-scale update rule converge to a local nash equilibrium. Advances in neural information processing systems, 30: 6626\u20136637","journal-title":"Advances in Neural Information Processing Systems"},{"key":"1977_CR66","first-page":"6840","volume":"33","author":"J Ho","year":"2020","unstructured":"Ho, J., Jain, A., & Abbeel, P. (2020). Denoising Diffusion Probabilistic Models. Adv. 
Neural Inform. Process. Syst., 33, 6840\u20136851.","journal-title":"Advances in Neural Information Processing Systems"},{"issue":"8","key":"1977_CR67","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., & Schmidhuber, J. (1997). Long short-term memory. Neural Comput, 9(8), 1735\u20131780.","journal-title":"Neural Computation"},{"key":"1977_CR68","doi-asserted-by":"crossref","unstructured":"Hong, X., Xiong, P., Ji, R., & Fan, H. (2019). Deep fusion network for image completion. In Proceedings of the 27th ACM international conference on multimedia (pp. 2033-2042).","DOI":"10.1145\/3343031.3351002"},{"key":"1977_CR69","first-page":"12454","volume":"34","author":"E Hoogeboom","year":"2021","unstructured":"Hoogeboom, E., Nielsen, D., Jaini, P., Forr\u00e9, P., & Welling, M. (2021). Argmax Flows and Multinomial Diffusion: Learning Categorical Distributions. Adv. Neural Inform. Process. Syst., 34, 12454\u201312465.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"1977_CR70","doi-asserted-by":"crossref","unstructured":"Houle, M. E. (2017). Local intrinsic dimensionality I: an extreme-value-theoretic foundation for similarity applications. In Similarity search and applications: 10th international conference, SISAP 2017, Munich, Germany, October 4-6, 2017, Proceedings 10 (pp. 64-79). Springer International Publishing.","DOI":"10.1007\/978-3-319-68474-1_5"},{"key":"1977_CR71","doi-asserted-by":"crossref","unstructured":"Houle, M. E. (2017). Local intrinsic dimensionality II: multivariate analysis and distributional support. In Similarity Search and Applications: 10th International Conference, SISAP 2017, Munich, Germany, October 4-6, 2017, Proceedings 10 (pp. 80-95). Springer International Publishing.","DOI":"10.1007\/978-3-319-68474-1_6"},{"key":"1977_CR72","doi-asserted-by":"crossref","unstructured":"Hu, J., Shen, L., & Sun, G. 
(2018). Squeeze-and-excitation networks. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 7132-7141).","DOI":"10.1109\/CVPR.2018.00745"},{"key":"1977_CR73","doi-asserted-by":"crossref","unstructured":"Hu, Y. T., Wang, H., Ballas, N., Grauman, K., & Schwing, A. G. (2020). Proposal-based video completion. In Computer Vision-ECCV 2020: 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part XXVII 16 (pp. 38-54). Springer International Publishing.","DOI":"10.1007\/978-3-030-58583-9_3"},{"issue":"4","key":"1977_CR74","first-page":"1","volume":"33","author":"JB Huang","year":"2014","unstructured":"Huang, J. B., Kang, S. B., Ahuja, N., & Kopf, J. (2014). Image completion using planar structure guidance. ACM Transactions on Graphics (Proc SIGGRAPH), 33(4), 1\u201310.","journal-title":"ACM Transactions on Graphics"},{"issue":"6","key":"1977_CR75","first-page":"1","volume":"35","author":"JB Huang","year":"2016","unstructured":"Huang, J. B., Kang, S. B., Ahuja, N., & Kopf, J. (2016). Temporally coherent completion of dynamic video. ACM Trans Graph, 35(6), 1\u201311.","journal-title":"ACM Transactions on Graphics"},{"key":"1977_CR76","doi-asserted-by":"crossref","unstructured":"Huang, X., & Belongie, S. (2017). Arbitrary style transfer in real-time with adaptive instance normalization. In Proceedings of the IEEE international conference on computer vision (pp. 1501-1510).","DOI":"10.1109\/ICCV.2017.167"},{"key":"1977_CR77","unstructured":"Hui, Z., Li, J., Wang, X., & Gao, X. (2020). Image fine-grained inpainting. arXiv preprint arXiv:2002.02609"},{"issue":"4","key":"1977_CR78","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3072959.3073659","volume":"36","author":"S Iizuka","year":"2017","unstructured":"Iizuka, S., Simo-Serra, E., & Ishikawa, H. (2017). Globally and locally consistent image completion. 
ACM Trans Graph (Proc SIGGRAPH), 36(4), 1\u201314.","journal-title":"ACM Transactions on Graphics"},{"issue":"6","key":"1977_CR79","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1111\/cgf.12518","volume":"34","author":"S Ilan","year":"2015","unstructured":"Ilan, S., & Shamir, A. (2015). A survey on data-driven video completion. Comput Graph Forum, 34(6), 60\u201385.","journal-title":"Computer Graphics Forum"},{"key":"1977_CR80","doi-asserted-by":"crossref","unstructured":"Ilg, E., Mayer, N., Saikia, T., Keuper, M., Dosovitskiy, A., & Brox, T. (2017). Flownet 2.0: Evolution of optical flow estimation with deep networks. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 2462-2470).","DOI":"10.1109\/CVPR.2017.179"},{"key":"1977_CR81","doi-asserted-by":"crossref","unstructured":"Isola, P., Zhu, J. Y., Zhou, T., & Efros, A. A. (2017). Image-to-image translation with conditional adversarial networks. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 1125-1134).","DOI":"10.1109\/CVPR.2017.632"},{"key":"1977_CR82","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2020.103147","volume":"203","author":"J Jam","year":"2021","unstructured":"Jam, J., Kendrick, C., Walker, K., Drouard, V., Hsu, J. G. S., & Yap, M. H. (2021). A comprehensive review of past and present image inpainting methods. Comput Vis Image Understand, 203, 103147.","journal-title":"Computer Vision and Image Understanding"},{"key":"1977_CR83","doi-asserted-by":"crossref","unstructured":"Jiang, L., Dai, B., Wu, W., & Loy, C. C. (2021). Focal frequency loss for image reconstruction and synthesis. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 13919-13929).","DOI":"10.1109\/ICCV48922.2021.01366"},{"key":"1977_CR84","doi-asserted-by":"crossref","unstructured":"Johnson, J., Alahi, A., & Fei-Fei, L. (2016). Perceptual losses for real-time style transfer and super-resolution. 
In Computer Vision-ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11-14, 2016, Proceedings, Part II 14 (pp. 694-711). Springer International Publishing.","DOI":"10.1007\/978-3-319-46475-6_43"},{"key":"1977_CR85","doi-asserted-by":"crossref","unstructured":"Kang, J., Oh, S. W., & Kim, S. J. (2022). Error compensation framework for flow-guided video inpainting. In European conference on computer vision (pp. 375-390). Cham: Springer Nature Switzerland.","DOI":"10.1007\/978-3-031-19784-0_22"},{"key":"1977_CR86","unstructured":"Karras, T., Aila, T., Laine, S., & Lehtinen, J. (2018). Progressive growing of GANs for improved quality, stability, and variation. International conference on learning representations"},{"key":"1977_CR87","doi-asserted-by":"crossref","unstructured":"Karras, T., Laine, S., & Aila, T. (2019). A style-based generator architecture for generative adversarial networks. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 4401-4410).","DOI":"10.1109\/CVPR.2019.00453"},{"key":"1977_CR88","doi-asserted-by":"crossref","unstructured":"Karras, T., Laine, S., Aittala, M., Hellsten, J., Lehtinen, J., & Aila, T. (2020). Analyzing and improving the image quality of stylegan. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 8110-8119).","DOI":"10.1109\/CVPR42600.2020.00813"},{"key":"1977_CR89","doi-asserted-by":"crossref","unstructured":"Ke L, Tai YW, Tang CK (2021) Occlusion-aware video object inpainting. In: Int. Conf. Comput. Vis., pp 14468\u201314478","DOI":"10.1109\/ICCV48922.2021.01420"},{"key":"1977_CR90","doi-asserted-by":"crossref","unstructured":"Kim, D., Woo, S., Lee, J. Y., & Kweon, I. S. (2019). Deep blind video decaptioning by temporal aggregation and recurrence. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 
4263-4272).","DOI":"10.1109\/CVPR.2019.00439"},{"key":"1977_CR91","doi-asserted-by":"crossref","unstructured":"Kim, D., Woo, S., Lee, J.Y., & Kweon, I.S. (2019b). Deep video inpainting. In IEEE conference on computer vision and pattern Recognition (pp. 5792\u20135801)","DOI":"10.1109\/CVPR.2019.00594"},{"key":"1977_CR92","doi-asserted-by":"crossref","unstructured":"Kim, S. Y., Aberman, K., Kanazawa, N., Garg, R., Wadhwa, N., Chang, H., & Liba, O. (2022). Zoom-to-inpaint: Image inpainting with high-frequency details. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 477-487).","DOI":"10.1109\/CVPRW56347.2022.00063"},{"key":"1977_CR93","unstructured":"Kingma, D. P., & Dhariwal, P. (2018). Glow: generative flow with invertible 1x1 convolutions. Advances in Neural Information Processing Systems, 31."},{"key":"1977_CR94","unstructured":"Kingma, D. P., & Welling, M. (2013). Auto-encoding variational bayes. In IEEE conference on computer vision and pattern Recognition."},{"key":"1977_CR95","doi-asserted-by":"crossref","unstructured":"Lai, W. S., Huang, J. B., Wang, O., Shechtman, E., Yumer, E., & Yang, M. H. (2018). Learning blind video temporal consistency. In Proceedings of the European conference on computer vision (ECCV) (pp. 170-185).","DOI":"10.1007\/978-3-030-01267-0_11"},{"key":"1977_CR96","doi-asserted-by":"crossref","unstructured":"Lao, D., Zhu, P., Wonka, P., & Sundaramoorthi, G. (2021). Flow-guided video inpainting with scene templates. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 14599-14608).","DOI":"10.1109\/ICCV48922.2021.01433"},{"key":"1977_CR97","doi-asserted-by":"crossref","unstructured":"Ledig, C., Theis, L., Husz\u00e1ir, F., Caballero, J., Cunningham, A., Acosta, A., & Shi, W. (2017). Photo-realistic single image super-resolution using a generative adversarial network. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 
4681-4690).","DOI":"10.1109\/CVPR.2017.19"},{"key":"1977_CR98","doi-asserted-by":"crossref","unstructured":"Lee, S., Oh, S. W., Won, D., & Kim, S. J. (2019). Copy-and-paste networks for deep video inpainting. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 4413-4421).","DOI":"10.1109\/ICCV.2019.00451"},{"key":"1977_CR99","doi-asserted-by":"crossref","unstructured":"Lempitsky, V., Vedaldi, A., & Ulyanov, D. (2018). Deep image prior. IEEE conference on computer vision and pattern recognition (pp. 9446\u20139454)","DOI":"10.1109\/CVPR.2018.00984"},{"key":"1977_CR100","doi-asserted-by":"crossref","unstructured":"Li, A., Qi, J., Zhang, R., Ma, X., & Ramamohanarao, K. (2019). Generative image inpainting with submanifold alignment. In International joint conference on artificial intelligence (pp. 811\u2013817)","DOI":"10.24963\/ijcai.2019\/114"},{"key":"1977_CR101","doi-asserted-by":"crossref","unstructured":"Li, A., Zhao, S., Ma, X., Gong, M., Qi, J., Zhang, R., & Kotagiri, R. (2020). Short-term and long-term context aggregation network for video inpainting. In Computer Vision-ECCV 2020: 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part IV 16 (pp. 728-743). Springer International Publishing.","DOI":"10.1007\/978-3-030-58548-8_42"},{"key":"1977_CR102","doi-asserted-by":"publisher","first-page":"376","DOI":"10.1016\/j.neucom.2022.11.074","volume":"520","author":"A Li","year":"2023","unstructured":"Li, A., Zhao, L., Zuo, Z., Wang, Z., Xing, W., & Lu, D. (2023). Migt: Multi-modal image inpainting guided with text. Neurocomputing, 520, 376\u2013385.","journal-title":"Neurocomputing"},{"key":"1977_CR103","doi-asserted-by":"publisher","DOI":"10.1016\/j.sigpro.2021.108278","volume":"189","author":"B Li","year":"2021","unstructured":"Li, B., Zheng, B., Li, H., & Li, Y. (2021). Detail-enhanced image inpainting based on discrete wavelet transforms. 
Sign Process, 189, 108278.","journal-title":"Signal Process"},{"key":"1977_CR104","doi-asserted-by":"crossref","unstructured":"Li, C. T., Siu, W. C., Liu, Z. S., Wang, L. W., & Lun, D. P. K. (2020). DeepGIN: Deep generative inpainting network for extreme image inpainting. In Computer Vision-ECCV 2020 Workshops: Glasgow, UK, August 23-28, 2020, Proceedings, Part IV 16 (pp. 5-22). Springer International Publishing.","DOI":"10.1007\/978-3-030-66823-5_1"},{"key":"1977_CR105","doi-asserted-by":"publisher","first-page":"743","DOI":"10.1109\/TCI.2022.3190142","volume":"8","author":"F Li","year":"2022","unstructured":"Li, F., Li, A., Qin, J., Bai, H., Lin, W., Cong, R., & Zhao, Y. (2022). Srinpaintor: When super-resolution meets transformer for image inpainting. IEEE Trans Computational Imaging, 8, 743\u2013758.","journal-title":"IEEE Transactions on Computational Imaging"},{"issue":"12","key":"1977_CR106","doi-asserted-by":"publisher","first-page":"4398","DOI":"10.1109\/TCYB.2018.2865036","volume":"49","author":"H Li","year":"2018","unstructured":"Li, H., Li, G., Lin, L., Yu, H., & Yu, Y. (2018). Context-aware semantic inpainting. IEEE transactions on cybernetics, 49(12), 4398-4411.","journal-title":"IEEE Transactions on Cybernetics"},{"key":"1977_CR107","doi-asserted-by":"crossref","unstructured":"Li, J., He, F., Zhang, L., Du, B., & Tao, D. (2019). Progressive reconstruction of visual structure for image inpainting. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 5962-5971).","DOI":"10.1109\/ICCV.2019.00606"},{"key":"1977_CR108","doi-asserted-by":"crossref","unstructured":"Li, J., Wang, N., Zhang, L., Du, B., & Tao, D. (2020). Recurrent feature reasoning for image inpainting. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 7760-7768).","DOI":"10.1109\/CVPR42600.2020.00778"},{"key":"1977_CR109","doi-asserted-by":"crossref","unstructured":"Li, W., Lin, Z., Zhou, K., Qi, L., Wang, Y., & Jia, J. 
(2022). Mat: Mask-aware transformer for large hole image inpainting. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 10758-10768).","DOI":"10.1109\/CVPR52688.2022.01049"},{"key":"1977_CR110","doi-asserted-by":"crossref","unstructured":"Li, W., Yu, X., Zhou, K., Song, Y., Lin, Z., & Jia, J. (2022). Sdm: Spatial diffusion model for large hole image inpainting. arXiv preprint arXiv:2212.02963","DOI":"10.1109\/CVPR52688.2022.01049"},{"key":"1977_CR111","doi-asserted-by":"crossref","unstructured":"Li, Y., Liu, S., Yang, J., & Yang, M. H. (2017). Generative face completion. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 3911-3919).","DOI":"10.1109\/CVPR.2017.624"},{"key":"1977_CR112","doi-asserted-by":"crossref","unstructured":"Li, Y., Jiang, B., Lu, Y., & Shen, L. (2019). Fine-grained adversarial image inpainting with super resolution. In 2019 International Joint Conference on Neural Networks (IJCNN) (pp. 1-8). IEEE.","DOI":"10.1109\/IJCNN.2019.8852241"},{"key":"1977_CR113","doi-asserted-by":"crossref","unstructured":"Li, Z., Lu, C. Z., Qin, J., Guo, C. L., & Cheng, M. M. (2022). Towards an end-to-end framework for flow-guided video inpainting. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 17562-17571).","DOI":"10.1109\/CVPR52688.2022.01704"},{"key":"1977_CR114","first-page":"382","volume":"11361","author":"H Liao","year":"2018","unstructured":"Liao, H., Funka-Lea, G., Zheng, Y., Luo, J., & Zhou, S. K. (2018). Face Completion with Semantic Knowledge and Collaborative Adversarial Learning. Asian Conf. Comput. Vis., 11361, 382\u2013397.","journal-title":"Asian Conference on Computer Vision"},{"key":"1977_CR115","doi-asserted-by":"crossref","unstructured":"Liao, L., Hu, R., Xiao, J., & Wang, Z. (2018). Edge-aware context encoder for image inpainting. In 2018 IEEE International conference on acoustics, speech and signal processing (ICASSP) (pp. 
3156-3160). IEEE.","DOI":"10.1109\/ICASSP.2018.8462549"},{"key":"1977_CR116","doi-asserted-by":"crossref","unstructured":"Liao, L., Xiao, J., Wang, Z., Lin, C. W., & Satoh, S. I. (2020). Guidance and evaluation: Semantic-aware image inpainting for mixed scenes. In Computer Vision-ECCV 2020: 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part XXVII 16 (pp. 683-700). Springer International Publishing.","DOI":"10.1007\/978-3-030-58583-9_41"},{"key":"1977_CR117","doi-asserted-by":"crossref","unstructured":"Liao, L., Xiao, J., Wang, Z., Lin, C. W., & Satoh, S. I. (2021a). Image inpainting guided by coherence priors of semantics and textures. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 6539-6548).","DOI":"10.1109\/CVPR46437.2021.00647"},{"issue":"2","key":"1977_CR118","doi-asserted-by":"publisher","first-page":"310","DOI":"10.1109\/JSTSP.2020.3045627","volume":"15","author":"L Liao","year":"2021","unstructured":"Liao, L., Xiao, J., Wang, Z., Lin, C. W., & Satoh, S. (2021). Uncertainty-aware semantic guidance and estimation for image inpainting. IEEE J Selected Topics Sign Process, 15(2), 310\u2013323.","journal-title":"IEEE Journal of Selected Topics in Signal Processing"},{"key":"1977_CR119","unstructured":"Lim, J.H., & Ye, J.C. (2017). Geometric gan. arXiv preprint arXiv:1705.02894"},{"key":"1977_CR120","doi-asserted-by":"crossref","unstructured":"Lin, J., Gan, C., & Han, S. (2019). Tsm: Temporal shift module for efficient video understanding. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 7083-7093).","DOI":"10.1109\/ICCV.2019.00718"},{"key":"1977_CR121","doi-asserted-by":"crossref","unstructured":"Lin, Q., Yan, B., Li, J., & Tan, W. (2020, October). Mmfl: Multimodal fusion learning for text-guided image inpainting. In Proceedings of the 28th ACM international conference on multimedia (pp. 
1094-1102).","DOI":"10.1145\/3394171.3413982"},{"key":"1977_CR122","doi-asserted-by":"crossref","unstructured":"Liu, G., Reda, F. A., Shih, K. J., Wang, T. C., Tao, A., & Catanzaro, B. (2018). Image inpainting for irregular holes using partial convolutions. In Proceedings of the European conference on computer vision (ECCV) (pp. 85-100).","DOI":"10.1007\/978-3-030-01252-6_6"},{"key":"1977_CR123","doi-asserted-by":"crossref","unstructured":"Liu, H., Jiang, B., Xiao, Y., & Yang, C. (2019). Coherent semantic attention for image inpainting. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 4170-4179).","DOI":"10.1109\/ICCV.2019.00427"},{"key":"1977_CR124","doi-asserted-by":"crossref","unstructured":"Liu, H., Jiang, B., Song, Y., Huang, W., & Yang, C. (2020). Rethinking image inpainting via a mutual encoder-decoder with feature equalizations. In Computer Vision-ECCV 2020: 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part II 16 (pp. 725-741). Springer International Publishing.","DOI":"10.1007\/978-3-030-58536-5_43"},{"key":"1977_CR125","doi-asserted-by":"crossref","unstructured":"Liu, H., Wan, Z., Huang, W., Song, Y., Han, X., & Liao, J. (2021). Pd-gan: Probabilistic diverse gan for image inpainting. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 9371-9381).","DOI":"10.1109\/CVPR46437.2021.00925"},{"key":"1977_CR126","doi-asserted-by":"crossref","unstructured":"Liu, R., Deng, H., Huang, Y., Shi, X., Lu, L., Sun, W., & Li, H. (2021). Fuseformer: Fusing fine-grained information in transformers for video inpainting. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 14040-14049).","DOI":"10.1109\/ICCV48922.2021.01378"},{"key":"1977_CR127","doi-asserted-by":"crossref","unstructured":"Liu, T., Liao, L., Wang, Z., & Satoh, S. I. (2022). Reference-guided texture and structure inference for image inpainting. 
In 2022 IEEE international conference on image processing (ICIP) (pp. 1996-2000). IEEE.","DOI":"10.1109\/ICIP46576.2022.9897592"},{"key":"1977_CR128","doi-asserted-by":"publisher","first-page":"81","DOI":"10.1016\/j.patrec.2020.12.008","volume":"143","author":"W Liu","year":"2021","unstructured":"Liu, W., Cao, C., Liu, J., Ren, C., Wei, Y., & Guo, H. (2021). Fine-grained image inpainting with scale-enhanced generative adversarial network. Pattern Recognition Letters, 143: 81\u201387.","journal-title":"Pattern Recognition Letters"},{"key":"1977_CR129","doi-asserted-by":"crossref","unstructured":"Liu, Z., Luo, P., Wang, X., & Tang, X. (2015). Deep learning face attributes in the wild. In Proceedings of the IEEE international conference on computer vision (pp. 3730-3738).","DOI":"10.1109\/ICCV.2015.425"},{"key":"1977_CR130","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., Cao, Y., Hu, H., Wei, Y., Zhang, Z., & Guo, B. (2021). Swin transformer: Hierarchical vision transformer using shifted windows. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 10012-10022).","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"1977_CR131","doi-asserted-by":"crossref","unstructured":"Lu, Z., Jiang, J., Huang, J., Wu, G., & Liu, X. (2022). Glama: Joint spatial and frequency loss for general image inpainting. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 1301-1310).","DOI":"10.1109\/CVPRW56347.2022.00136"},{"key":"1977_CR132","doi-asserted-by":"crossref","unstructured":"Lugmayr, A., Danelljan, M., Van Gool, L., & Timofte, R. (2020). Srflow: Learning the super-resolution space with normalizing flow. In Computer Vision-ECCV 2020: 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part V 16 (pp. 715-732). 
Springer International Publishing.","DOI":"10.1007\/978-3-030-58558-7_42"},{"key":"1977_CR133","doi-asserted-by":"crossref","unstructured":"Lugmayr, A., Danelljan, M., Romero, A., Yu, F., Timofte, R., & Van Gool, L. (2022). Repaint: Inpainting using denoising diffusion probabilistic models. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR52688.2022.01117"},{"key":"1977_CR134","doi-asserted-by":"crossref","unstructured":"Ma, Y., Liu, X., Bai, S., Wang, L., He, D., & Liu, A. (2019, August). Coarse-to-fine image inpainting via region-wise convolutions and non-local correlation. In Ijcai (pp. 3123-3129).","DOI":"10.24963\/ijcai.2019\/433"},{"issue":"7","key":"1977_CR135","doi-asserted-by":"publisher","first-page":"674","DOI":"10.1109\/34.192463","volume":"11","author":"SG Mallat","year":"1989","unstructured":"Mallat, S. G. (1989). A theory for multiresolution signal decomposition: the wavelet representation. IEEE Trans Pattern Anal Mach Intell, 11(7), 674\u2013693.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1977_CR136","doi-asserted-by":"crossref","unstructured":"Mao, X., Li, Q., Xie, H., Lau, R. Y., Wang, Z., & Paul Smolley, S. (2017). Least squares generative adversarial networks. In Proceedings of the IEEE international conference on computer vision (pp. 2794-2802).","DOI":"10.1109\/ICCV.2017.304"},{"key":"1977_CR137","doi-asserted-by":"crossref","unstructured":"Masnou, S., & Morel, J. M. (1998, October). Level lines based disocclusion. In Proceedings 1998 International Conference on Image Processing. ICIP98 (Cat. No. 98CB36269) (pp. 259-263). IEEE.","DOI":"10.1109\/ICIP.1998.999016"},{"key":"1977_CR138","doi-asserted-by":"crossref","unstructured":"Navasardyan, S., & Ohanyan, M. (2020). Image inpainting with onion convolutions. 
In Proceedings of the Asian conference on computer vision","DOI":"10.1007\/978-3-030-69532-3_1"},{"key":"1977_CR139","doi-asserted-by":"crossref","unstructured":"Nazeri, K., Ng, E., Joseph, T., Qureshi, F., & Ebrahimi, M. (2019). Edgeconnect: Structure guided image inpainting using edge prediction. In Proceedings of the IEEE\/CVF international conference on computer vision workshops (pp. 0-0).","DOI":"10.1109\/ICCVW.2019.00408"},{"issue":"4","key":"1977_CR140","doi-asserted-by":"publisher","first-page":"1993","DOI":"10.1137\/140954933","volume":"7","author":"A Newson","year":"2014","unstructured":"Newson, A., Almansa, A., Fradet, M., Gousseau, Y., & P\u00e9rez, P. (2014). Video inpainting of complex scenes. SIAM J Imaging Sciences, 7(4), 1993\u20132019.","journal-title":"Siam Journal on Imaging Sciences"},{"key":"1977_CR141","doi-asserted-by":"crossref","unstructured":"Ni, M., Li, X., & Zuo, W. (2023). NUWA-LIP: language-guided image inpainting with defect-free VQGAN. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (pp. 14183-14192).","DOI":"10.1109\/CVPR52729.2023.01363"},{"key":"1977_CR142","doi-asserted-by":"crossref","unstructured":"Oh, S. W., Lee, S., Lee, J. Y., & Kim, S. J. (2019). Onion-peel networks for deep video completion. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 4403-4412).","DOI":"10.1109\/ICCV.2019.00450"},{"issue":"1","key":"1977_CR143","doi-asserted-by":"publisher","first-page":"51","DOI":"10.1016\/0031-3203(95)00067-4","volume":"29","author":"T Ojala","year":"1996","unstructured":"Ojala, T., & Pietik\u00e4inen M, Harwood D, (1996). A comparative study of texture measures with classification based on featured distributions. 
Pattern Recog, 29(1), 51\u201359.","journal-title":"Pattern Recognition"},{"issue":"7","key":"1977_CR144","doi-asserted-by":"publisher","first-page":"971","DOI":"10.1109\/TPAMI.2002.1017623","volume":"24","author":"T Ojala","year":"2002","unstructured":"Ojala, T., Pietikainen, M., & Maenpaa, T. (2002). Multiresolution gray-scale and rotation invariant texture classification with local binary patterns. IEEE Trans Pattern Anal Mach Intell, 24(7), 971\u2013987.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1977_CR145","doi-asserted-by":"crossref","unstructured":"Ouyang, H., Wang, T., & Chen, Q. (2021). Internal video inpainting by implicit long-range propagation. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 14579-14588).","DOI":"10.1109\/ICCV48922.2021.01431"},{"key":"1977_CR146","doi-asserted-by":"crossref","unstructured":"Park, T., Liu, M. Y., Wang, T. C., & Zhu, J. Y. (2019). Semantic image synthesis with spatially-adaptive normalization. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 2337-2346).","DOI":"10.1109\/CVPR.2019.00244"},{"key":"1977_CR147","doi-asserted-by":"crossref","unstructured":"Parmar, G., Singh, K.K., Zhang, R., Li, Y., Lu, J., Zhu, J.Y. (2023). Zero-shot image-to-image translation. arXiv preprint arXiv:2302.03027","DOI":"10.1145\/3588432.3591513"},{"key":"1977_CR148","doi-asserted-by":"crossref","unstructured":"Pathak, D., Krahenbuhl, P., Donahue, J., Darrell, T., & Efros, A. A. (2016). Context encoders: Feature learning by inpainting. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 2536-2544).","DOI":"10.1109\/CVPR.2016.278"},{"key":"1977_CR149","doi-asserted-by":"crossref","unstructured":"Peng, J., Liu, D., Xu, S., & Li, H. (2021). Generating diverse structure for image inpainting with hierarchical VQ-VAE. 
In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (pp. 10770-10779)","DOI":"10.1109\/CVPR46437.2021.01063"},{"key":"1977_CR150","doi-asserted-by":"crossref","unstructured":"Perazzi, F., Pont-Tuset, J., McWilliams, B., Van Gool, L., Gross, M., & Sorkine-Hornung, A. (2016). A benchmark dataset and evaluation methodology for video object segmentation. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 724-732).","DOI":"10.1109\/CVPR.2016.85"},{"key":"1977_CR151","doi-asserted-by":"publisher","first-page":"1873","DOI":"10.1109\/LSP.2021.3109774","volume":"28","author":"SS Phutke","year":"2021","unstructured":"Phutke, S. S., & Murala, S. (2021). Diverse receptive field based adversarial concurrent encoder network for image inpainting. IEEE Sign Process Letters, 28, 1873\u20131877.","journal-title":"IEEE Signal Processing Letters"},{"key":"1977_CR152","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2020.103155","volume":"204","author":"J Qin","year":"2021","unstructured":"Qin, J., Bai, H., & Zhao, Y. (2021). Multi-scale attention network for image inpainting. Comput Vis Image Understand, 204, 103155.","journal-title":"Computer Vision Image Understanding"},{"key":"1977_CR153","doi-asserted-by":"publisher","first-page":"12997","DOI":"10.1109\/ACCESS.2021.3051982","volume":"9","author":"J Qiu","year":"2021","unstructured":"Qiu, J., Gao, Y., & Shen, M. (2021). Semantic-sca: Semantic structure image inpainting with the spatial-channel attention. IEEE Access, 9, 12997\u201313008.","journal-title":"IEEE Access"},{"key":"1977_CR154","doi-asserted-by":"publisher","first-page":"2405","DOI":"10.1109\/TIP.2022.3152624","volume":"31","author":"W Quan","year":"2022","unstructured":"Quan, W., Zhang, R., Zhang, Y., Li, Z., Wang, J., & Yan, D. M. (2022). Image inpainting with local and global refinement. 
IEEE Trans Image Process, 31, 2405\u20132420.","journal-title":"IEEE Transactions on Image Processing"},{"key":"1977_CR155","unstructured":"Radford, A., Metz, L., & Chintala, S. (2016). Unsupervised representation learning with deep convolutional generative adversarial networks. In The International Conference on Learning Representations"},{"key":"1977_CR156","doi-asserted-by":"crossref","unstructured":"Ren, J., Zheng, Q., Zhao, Y., Xu, X., & Li, C. (2022). Dlformer: Discrete latent transformer for video inpainting. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 3511-3520).","DOI":"10.1109\/CVPR52688.2022.00350"},{"key":"1977_CR157","first-page":"901","volume":"28","author":"JS Ren","year":"2015","unstructured":"Ren, J. S., Xu, L., Yan, Q., & Sun, W. (2015). Shepard Convolutional Neural Networks. Adv. Neural Inform. Process. Syst., 28, 901\u2013909.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"1977_CR158","doi-asserted-by":"crossref","unstructured":"Ren, Y., Yu, X., Zhang, R., Li, T. H., Liu, S., & Li, G. (2019). Structureflow: Image inpainting via structure-aware appearance flow. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 181-190).","DOI":"10.1109\/ICCV.2019.00027"},{"key":"1977_CR159","unstructured":"Rezende, D., & Mohamed, S. (2015). Variational inference with normalizing flows. In International conference on machine learning (pp. 1530-1538)."},{"key":"1977_CR160","doi-asserted-by":"crossref","unstructured":"Richardson, E., Alaluf, Y., Patashnik, O., Nitzan, Y., Azar, Y., Shapiro, S., & Cohen-Or, D. (2021). Encoding in style: a stylegan encoder for image-to-image translation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 2287-2296).","DOI":"10.1109\/CVPR46437.2021.00232"},{"key":"1977_CR161","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., & Ommer, B. (2022). 
High-resolution image synthesis with latent diffusion models. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 10684-10695).","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"1977_CR162","unstructured":"R\u00f6ssler, A., Cozzolino, D., Verdoliva, L., Riess, C., Thies, J., Nie\u00dfner, M. (2018). Faceforensics: A large-scale video dataset for forgery detection in human faces. arXiv preprint arXiv:1803.09179"},{"issue":"2","key":"1977_CR163","doi-asserted-by":"publisher","DOI":"10.1117\/1.JEI.30.2.023016","volume":"30","author":"H Roy","year":"2021","unstructured":"Roy, H., Chaudhury, S., Yamasaki, T., & Hashimoto, T. (2021). Image inpainting using frequency-domain priors. J Electronic Imaging, 30(2), 023016.","journal-title":"Journal of Electronic Imaging"},{"key":"1977_CR164","doi-asserted-by":"crossref","unstructured":"Ruder, M., Dosovitskiy, A., & Brox, T. (2016). Artistic style transfer for videos. In Pattern Recognition: 38th German Conference, GCPR 2016, Hannover, Germany, September 12-15, 2016, Proceedings 38 (pp. 26-36). Springer International Publishing.","DOI":"10.1007\/978-3-319-45886-1_3"},{"issue":"1","key":"1977_CR165","doi-asserted-by":"publisher","first-page":"259","DOI":"10.1016\/0167-2789(92)90242-F","volume":"60","author":"LI Rudin","year":"1992","unstructured":"Rudin, L. I., Osher, S., & Fatemi, E. (1992). Nonlinear total variation based noise removal algorithms. Physica D: Nonlinear Phenomena, 60(1), 259\u2013268.","journal-title":"Physica D: Nonlinear Phenomena"},{"key":"1977_CR166","doi-asserted-by":"crossref","unstructured":"Sagong, M. C., Shin, Y. G., Kim, S. W., Park, S., & Ko, S. J. (2019). Pepsi: Fast image inpainting with parallel decoding network. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 
11360-11368).","DOI":"10.1109\/CVPR.2019.01162"},{"key":"1977_CR167","doi-asserted-by":"crossref","unstructured":"Saharia, C., Chan, W., Chang, H., Lee, C., Ho, J., Salimans, T., & Norouzi, M. (2022). Palette: Image-to-image diffusion models. In ACM SIGGRAPH 2022 conference proceedings (pp. 1-10).","DOI":"10.1145\/3528233.3530757"},{"key":"1977_CR168","first-page":"36479","volume":"35","author":"C Saharia","year":"2022","unstructured":"Saharia, C., Chan, W., Saxena, S., Li, L., Whang, J., Denton, E. L., & Norouzi, M. (2022). Photorealistic text-to-image diffusion models with deep language understanding. Advances in Neural Information Processing Systems, 35, 36479\u201336494.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"1977_CR169","doi-asserted-by":"crossref","unstructured":"Schrader, K., Peter, P., K\u00e4amper, N., & Weickert, J. (2023). Efficient neural generation of 4k masks for homogeneous diffusion inpainting. In International conference on scale space and variational methods in computer vision (pp. 16-28).","DOI":"10.1007\/978-3-031-31975-4_2"},{"key":"1977_CR170","first-page":"25278","volume":"35","author":"C Schuhmann","year":"2022","unstructured":"Schuhmann C, Beaumont R, Vencu R, Gordon CW, Wightman R, Cherti M, Coombes T, Katta A, Mullis C, Wortsman M, Schramowski P, Kundurthy SR, Crowson K, Schmidt L, Kaczmarczyk R, Jitsev J (2022) LAION-5B: An open large-scale dataset for training next generation image-text models. Advances in Neural Information Processing Systems, 35, 25278\u201325294.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"1977_CR171","volume":"87","author":"H Shao","year":"2020","unstructured":"Shao, H., Wang, Y., Fu, Y., & Yin, Z. (2020). Generative image inpainting via edge structure and color aware fusion. 
Sign Process: Image Communication, 87, 115929.","journal-title":"Signal Process: Image Communication"},{"key":"1977_CR172","doi-asserted-by":"crossref","unstructured":"Shen, L., Hong, R., Zhang, H., Zhang, H., & Wang, M. (2019). Single-shot semantic image inpainting with densely connected generative networks. In Proceedings of the 27th ACM International Conference on Multimedia (pp. 1861-1869).","DOI":"10.1145\/3343031.3350903"},{"issue":"1","key":"1977_CR173","doi-asserted-by":"publisher","first-page":"252","DOI":"10.1109\/TNNLS.2020.2978501","volume":"32","author":"YG Shin","year":"2021","unstructured":"Shin, Y. G., Sagong, M. C., Yeo, Y. J., Kim, S. W., & Ko, S. J. (2021). Pepsi++: Fast and lightweight network for image inpainting. IEEE Trans Neural Networks Learn Syst, 32(1), 252\u2013265.","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"1977_CR174","doi-asserted-by":"crossref","unstructured":"Shukla, T., Maheshwari, P., Singh, R., Shukla, A., Kulkarni, K., & Turaga, P. (2023). Scene graph driven text-prompt generation for image inpainting. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 759-768).","DOI":"10.1109\/CVPRW59228.2023.00083"},{"key":"1977_CR175","unstructured":"Simonyan, K., & Zisserman, A. (2014). Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556"},{"key":"1977_CR176","unstructured":"Sohl-Dickstein, J., Weiss, E., Maheswaranathan, N., & Ganguli, S. (2015). Deep unsupervised learning using nonequilibrium thermodynamics. In International conference on machine learning (pp. 2256-2265). PMLR."},{"key":"1977_CR177","doi-asserted-by":"crossref","unstructured":"Song, L., Cao, J., Song, L., Hu, Y., & He, R. (2019). Geometry-aware face completion and editing. In Proceedings of the AAAI conference on artificial intelligence (Vol. 33, No. 01, pp. 
2506-2513).","DOI":"10.1609\/aaai.v33i01.33012506"},{"key":"1977_CR178","doi-asserted-by":"crossref","unstructured":"Song, Y., Yang, C., Lin, Z., Liu, X., Huang, Q., Li, H., & Kuo, C. C. J. (2018). Contextual-based image inpainting: Infer, match, and translate. In Proceedings of the European conference on computer vision (ECCV) (pp. 3-19).","DOI":"10.1007\/978-3-030-01216-8_1"},{"key":"1977_CR179","unstructured":"Song, Y., Yang, C., Shen, Y., Wang, P., Huang, Q., & Kuo, C. C. J. (2018b). SPG-Net: Segmentation prediction and guidance network for image inpainting. In: Brit. Mach. Vis. Conf."},{"key":"1977_CR180","doi-asserted-by":"crossref","unstructured":"Sun, D., Yang, X., Liu, M. Y., & Kautz, J. (2018). Pwc-net: Cnns for optical flow using pyramid, warping, and cost volume. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 8934-8943).","DOI":"10.1109\/CVPR.2018.00931"},{"key":"1977_CR181","doi-asserted-by":"crossref","unstructured":"Sun, K., Xiao, B., Liu, D., & Wang, J. (2019). Deep high-resolution representation learning for human pose estimation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 5693-5703).","DOI":"10.1109\/CVPR.2019.00584"},{"key":"1977_CR182","doi-asserted-by":"crossref","unstructured":"Sun, Q., Ma, L., Oh, S. J., Van Gool, L., Schiele, B., & Fritz, M. (2018b). Natural and effective obfuscation by head inpainting. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 5050-5059).","DOI":"10.1109\/CVPR.2018.00530"},{"key":"1977_CR183","doi-asserted-by":"crossref","unstructured":"Suvorov, R., Logacheva, E., Mashikhin, A., Remizova, A., Ashukha, A., Silvestrov, A., & Lempitsky, V. (2022). Resolution-robust large mask inpainting with fourier convolutions. In Proceedings of the IEEE\/CVF winter conference on applications of computer vision (pp. 
2149-2159).","DOI":"10.1109\/WACV51458.2022.00323"},{"issue":"1","key":"1977_CR184","doi-asserted-by":"publisher","first-page":"217","DOI":"10.4310\/CMS.2010.v8.n1.a11","volume":"8","author":"EG Tabak","year":"2010","unstructured":"Tabak, E. G., & Vanden-Eijnden, E. (2010). Density estimation by dual ascent of the log-likelihood. Commun Math Sci, 8(1), 217\u2013233.","journal-title":"Communications in Mathematical Sciences"},{"issue":"4","key":"1977_CR185","doi-asserted-by":"publisher","first-page":"506","DOI":"10.1109\/TPAMI.2005.87","volume":"27","author":"D Tschumperl\u00e9","year":"2005","unstructured":"Tschumperl\u00e9, D., & Deriche, R. (2005). Vector-valued image regularization with pdes: a common framework for different applications. IEEE Trans Pattern Anal Mach Intell, 27(4), 506\u2013517.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1977_CR186","doi-asserted-by":"crossref","unstructured":"Tu, C. T., & Chen, Y. F. (2019, August). Facial image inpainting with variational autoencoder. In 2019 2nd international conference of intelligent robotic and control engineering (IRCE) (pp. 119-122). IEEE.","DOI":"10.1109\/IRCE.2019.00031"},{"key":"1977_CR187","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A. N., & Polosukhin, I. (2017). Attention is all you need. Advances in Neural Information Processing Systems, 30."},{"key":"1977_CR188","doi-asserted-by":"crossref","unstructured":"Vo, H. V., Duong, N. Q., & P\u00e9rez, P. (2018). Structural inpainting. In Proceedings of the 26th ACM international conference on multimedia (pp. 1948-1956).","DOI":"10.1145\/3240508.3240678"},{"key":"1977_CR189","doi-asserted-by":"crossref","unstructured":"Wadhwa, G., Dhall, A., Murala, S., & Tariq, U. (2021). Hyperrealistic image inpainting with hypergraphs. In Proceedings of the IEEE\/CVF winter conference on applications of computer vision (pp. 
3912-3921).","DOI":"10.1109\/WACV48630.2021.00396"},{"key":"1977_CR190","doi-asserted-by":"crossref","unstructured":"Wan, Z., Zhang, B., Chen, D., Zhang, P., Chen, D., Liao, J., & Wen, F. (2020). Bringing old photos back to life. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 2747-2757).","DOI":"10.1109\/CVPR42600.2020.00282"},{"key":"1977_CR191","doi-asserted-by":"crossref","unstructured":"Wan, Z., Zhang, J., Chen, D., & Liao, J. (2021). High-fidelity pluralistic image completion with transformers. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 4692-4701).","DOI":"10.1109\/ICCV48922.2021.00465"},{"key":"1977_CR192","doi-asserted-by":"crossref","unstructured":"Wang, C., Huang, H., Han, X., & Wang, J. (2019). Video inpainting by jointly learning temporal structure and spatial details. In Proceedings of the AAAI conference on artificial intelligence (pp. 5232-5239).","DOI":"10.1609\/aaai.v33i01.33015232"},{"key":"1977_CR193","doi-asserted-by":"crossref","unstructured":"Wang, C., Zhu, Y., & Yuan, C. (2022). Diverse Image Inpainting with Normalizing Flow. In European conference on computer vision (pp. 53-69).","DOI":"10.1007\/978-3-031-20050-2_4"},{"key":"1977_CR194","doi-asserted-by":"crossref","unstructured":"Wang, J., Wang, C., Huang, Q., Shi, Y., Cai, J. F., Zhu, Q., & Yin, B. (2020). Image inpainting based on multi-frequency probabilistic inference model. In Proceedings of the 28th ACM international conference on multimedia (pp. 1-9).","DOI":"10.1145\/3394171.3413891"},{"key":"1977_CR195","doi-asserted-by":"crossref","unstructured":"Wang, N., Li, J., Zhang, L., & Du, B. (2019). MUSICAL: Multi-scale image contextual attention learning for inpainting. In: IJCAI (pp. 
3748-3754).","DOI":"10.24963\/ijcai.2019\/520"},{"key":"1977_CR196","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107448","volume":"106","author":"N Wang","year":"2020","unstructured":"Wang, N., Ma, S., Li, J., Zhang, Y., & Zhang, L. (2020). Multistage attention network for image inpainting. Pattern Recog, 106, 107448.","journal-title":"Pattern Recognition"},{"key":"1977_CR197","doi-asserted-by":"publisher","first-page":"1784","DOI":"10.1109\/TIP.2020.3048629","volume":"30","author":"N Wang","year":"2021","unstructured":"Wang, N., Zhang, Y., & Zhang, L. (2021). Dynamic selection network for image inpainting. IEEE Trans Image Process, 30, 1784\u20131798.","journal-title":"IEEE Transactions on Image Processing"},{"key":"1977_CR198","doi-asserted-by":"crossref","unstructured":"Wang, S., Saharia, C., Montgomery, C., Pont-Tuset, J., Noy, S., Pellegrini, S., & Chan, W. (2023). Imagen editor and editbench: Advancing and evaluating text-guided image inpainting. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 18359-18369).","DOI":"10.1109\/CVPR52729.2023.01761"},{"key":"1977_CR199","doi-asserted-by":"crossref","unstructured":"Wang, T., Ouyang, H., & Chen, Q. (2021). Image inpainting with external-internal learning and monochromic bottleneck. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 5120-5129).","DOI":"10.1109\/CVPR46437.2021.00508"},{"key":"1977_CR200","unstructured":"Wang, T. C., Liu, M. Y., Zhu, J. Y., Liu, G., Tao, A., Kautz, J., & Catanzaro, B. (2018a). Video-to-Video Synthesis. Advances in Neural Information Processing Systems, 31"},{"key":"1977_CR201","doi-asserted-by":"crossref","unstructured":"Wang, W., Zhang, J., Niu, L., Ling, H., Yang, X., & Zhang, L. (2021). Parallel multi-resolution fusion network for image inpainting. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 
14559-14568).","DOI":"10.1109\/ICCV48922.2021.01429"},{"key":"1977_CR202","doi-asserted-by":"crossref","unstructured":"Wang, W., Niu, L., Zhang, J., Yang, X., & Zhang, L. (2022b). Dual-path image inpainting with auxiliary gan inversion. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 11421-11430).","DOI":"10.1109\/CVPR52688.2022.01113"},{"key":"1977_CR203","doi-asserted-by":"crossref","unstructured":"Wang, X., Girshick, R., Gupta, A., & He, K. (2018). Non-local neural networks. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 7794-7803).","DOI":"10.1109\/CVPR.2018.00813"},{"key":"1977_CR204","unstructured":"Wang, Y., Tao, X., Qi, X., Shen, X., & Jia, J. (2018). Image inpainting via generative multi-column convolutional neural networks. Advances in Neural Information Processing Systems, 31."},{"key":"1977_CR205","doi-asserted-by":"crossref","unstructured":"Wang, Y., Chen, Y. C., Tao, X., & Jia, J. (2020). Vcnet: A robust approach to blind image inpainting. In Computer Vision-ECCV 2020: 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part XXV 16 (pp. 752-768). Springer International Publishing.","DOI":"10.1007\/978-3-030-58595-2_45"},{"key":"1977_CR206","unstructured":"Wang, Z., Simoncelli, E. P., & Bovik, A. C. (2003, November). Multiscale structural similarity for image quality assessment. In The Thrity-seventh asilomar conference on signals, systems & computers, 2003 (Vol. 2, pp. 1398-1402). Ieee."},{"issue":"4","key":"1977_CR207","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1109\/TIP.2003.819861","volume":"13","author":"Z Wang","year":"2004","unstructured":"Wang, Z., Bovik, A. C., Sheikh, H. R., & Simoncelli, E. P. (2004). Image quality assessment: from error visibility to structural similarity. 
IEEE Trans Image Process, 13(4), 600\u2013612.","journal-title":"IEEE Transactions on Image Processing"},{"key":"1977_CR208","doi-asserted-by":"crossref","unstructured":"Weng, Y., Ding, S., & Zhou, T. (2022). A survey on improved GAN based image inpainting. In 2022 2nd international conference on consumer electronics and computer engineering (ICCECE) (pp. 319-322). IEEE.","DOI":"10.1109\/ICCECE54139.2022.9712740"},{"issue":"3","key":"1977_CR209","doi-asserted-by":"publisher","first-page":"463","DOI":"10.1109\/TPAMI.2007.60","volume":"29","author":"Y Wexler","year":"2007","unstructured":"Wexler, Y., Shechtman, E., & Irani, M. (2007). Space-time completion of video. IEEE Trans Pattern Anal Mach Intell, 29(3), 463\u2013476.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1977_CR210","unstructured":"Woo, S., Kim, D., Park, K., Lee, J. Y., & Kweon, I. S. (2019). Align-and-attend network for globally and locally coherent video inpainting. In The British Machine Vision Conference (BMVC) (pp.1\u201313)"},{"key":"1977_CR211","doi-asserted-by":"publisher","first-page":"4016","DOI":"10.1109\/TMM.2021.3111491","volume":"24","author":"H Wu","year":"2022","unstructured":"Wu, H., Zhou, J., & Li, Y. (2022). Deep generative model for image inpainting with local binary pattern learning and spatial attention. IEEE Trans Multimedia, 24, 4016\u20134027.","journal-title":"IEEE Transactions on Multimedia"},{"key":"1977_CR212","doi-asserted-by":"crossref","unstructured":"Wu, L., Zhang, C., Liu, J., Han, J., Liu, J., Ding, E., Bai, X. (2019). Editing text in the wild. In Proceedings of the 27th ACM international conference on multimedia (pp. 1500-1508).","DOI":"10.1145\/3343031.3350929"},{"key":"1977_CR213","doi-asserted-by":"crossref","unstructured":"Wu X, Xie Y, Zeng J, Yang Z, Yu Y, Li Q, Liu W (2021) Adversarial learning with mask reconstruction for text-guided image inpainting. In: ACM Int. Conf. 
Multimedia, pp 3464\u20133472","DOI":"10.1145\/3474085.3475506"},{"key":"1977_CR214","doi-asserted-by":"crossref","unstructured":"Xia W, Zhang Y, Yang Y, Xue JH, Zhou B, Yang MH (2022) Gan inversion: A survey. IEEE Trans Pattern Anal Mach Intell pp 1\u201317","DOI":"10.1109\/TPAMI.2022.3181070"},{"key":"1977_CR215","doi-asserted-by":"crossref","unstructured":"Xie C, Liu S, Li C, Cheng MM, Zuo W, Liu X, Wen S, Ding E (2019) Image Inpainting with Learnable Bidirectional Attention Maps. In: Int. Conf. Comput. Vis., pp 8858\u20138867","DOI":"10.1109\/ICCV.2019.00895"},{"key":"1977_CR216","doi-asserted-by":"crossref","unstructured":"Xie M, Li C, Liu X, Wong TT (2020) Manga filling style conversion with screentone variational autoencoder. ACM Trans Graph 39(6)","DOI":"10.1145\/3414685.3417873"},{"key":"1977_CR217","doi-asserted-by":"crossref","unstructured":"Xie M, Xia M, Liu X, Li C, Wong TT (2021) Seamless manga inpainting with semantics awareness. ACM Trans Graph 40(4)","DOI":"10.1145\/3450626.3459822"},{"key":"1977_CR218","doi-asserted-by":"crossref","unstructured":"Xie S, Zhang Z, Lin Z, Hinz T, Zhang K (2023) SmartBrush: Text and Shape Guided Object Inpainting With Diffusion Model. In: IEEE Conf. Comput. Vis. Pattern Recog., pp 22428\u201322437","DOI":"10.1109\/CVPR52729.2023.02148"},{"issue":"9\u201310","key":"1977_CR219","doi-asserted-by":"publisher","first-page":"3149","DOI":"10.1007\/s00371-022-02523-0","volume":"38","author":"Y Xie","year":"2022","unstructured":"Xie, Y., Lin, Z., Yang, Z., Deng, H., Wu, X., Mao, X., Li, Q., & Liu, W. (2022). Learning semantic alignment from image for text-guided image inpainting. The Visual Computer, 38(9\u201310), 3149\u20133161.","journal-title":"The Visual Computer"},{"key":"1977_CR220","doi-asserted-by":"crossref","unstructured":"Xiong W, Yu J, Lin Z, Yang J, Lu X, Barnes C, Luo J (2019) Foreground-Aware Image Inpainting. In: IEEE Conf. Comput. Vis. 
Pattern Recog., pp 5833\u20135841","DOI":"10.1109\/CVPR.2019.00599"},{"key":"1977_CR221","doi-asserted-by":"crossref","unstructured":"Xu N, Yang L, Fan Y, Yang J, Yue D, Liang Y, Price B, Cohen S, Huang T (2018a) YouTube-VOS: Sequence-to-Sequence Video Object Segmentation. In: Eur. Conf. Comput. Vis., pp 585\u2013601","DOI":"10.1007\/978-3-030-01228-1_36"},{"key":"1977_CR222","doi-asserted-by":"crossref","unstructured":"Xu R, Li X, Zhou B, Loy CC (2019) Deep flow-guided video inpainting. In: IEEE Conf. Comput. Vis. Pattern Recog., pp 3723\u20133732","DOI":"10.1109\/CVPR.2019.00384"},{"key":"1977_CR223","doi-asserted-by":"publisher","first-page":"9112","DOI":"10.1109\/TIP.2021.3122930","volume":"30","author":"R Xu","year":"2021","unstructured":"Xu, R., Guo, M., Wang, J., Li, X., Zhou, B., & Loy, C. C. (2021). Texture memory-augmented deep patch-based image inpainting. IEEE Trans Image Process, 30, 9112\u20139124.","journal-title":"IEEE Transactions on Image Processing"},{"key":"1977_CR224","doi-asserted-by":"crossref","unstructured":"Xu T, Zhang P, Huang Q, Zhang H, Gan Z, Huang X, He X (2018b) Attngan: Fine-grained text to image generation with attentional generative adversarial networks. In: IEEE Conf. Comput. Vis. Pattern Recog., pp 1316\u20131324","DOI":"10.1109\/CVPR.2018.00143"},{"key":"1977_CR225","doi-asserted-by":"crossref","unstructured":"Yamashita Y, Shimosato K, Ukita N (2022) Boundary-Aware Image Inpainting With Multiple Auxiliary Cues. In: IEEE Conf. Comput. Vis. Pattern Recog. Worksh., pp 619\u2013629","DOI":"10.1109\/CVPRW56347.2022.00077"},{"key":"1977_CR226","doi-asserted-by":"crossref","unstructured":"Yan Z, Li X, Li M, Zuo W, Shan S (2018) Shift-Net: Image Inpainting via Deep Feature Rearrangement. In: Eur. Conf. Comput. 
Vis., pp 3\u201319","DOI":"10.1007\/978-3-030-01264-9_1"},{"key":"1977_CR227","doi-asserted-by":"crossref","unstructured":"Yang C, Lu X, Lin Z, Shechtman E, Wang O, Li H (2017) High-resolution image inpainting using multi-scale neural patch synthesis. In: IEEE Conf. Comput. Vis. Pattern Recog., pp 6721\u20136729","DOI":"10.1109\/CVPR.2017.434"},{"key":"1977_CR228","first-page":"12605","volume":"34","author":"J Yang","year":"2020","unstructured":"Yang, J., Qi, Z., & Shi, Y. (2020). Learning to Incorporate Structure Knowledge for Image Inpainting. AAAI Conf. Artificial Intell., 34, 12605\u201312612.","journal-title":"AAAI Conf. Artificial Intell."},{"key":"1977_CR229","unstructured":"Yang L, Zhang Z, Song Y, Hong S, Xu R, Zhao Y, Zhang W, Cui B, Yang MH (2023) Diffusion models: A comprehensive survey of methods and applications. arxiv:2209.00796"},{"key":"1977_CR230","doi-asserted-by":"crossref","unstructured":"Yeh RA, Chen C, Lim TY, Schwing AG, Hasegawa-Johnson M, Do MN (2017) Semantic Image Inpainting with Deep Generative Models. In: IEEE Conf. Comput. Vis. Pattern Recog., pp 6882\u20136890","DOI":"10.1109\/CVPR.2017.728"},{"key":"1977_CR231","doi-asserted-by":"crossref","unstructured":"Yi Z, Tang Q, Azizi S, Jang D, Xu Z (2020) Contextual Residual Aggregation for Ultra High-Resolution Image Inpainting. In: IEEE Conf. Comput. Vis. Pattern Recog., pp 7508\u20137517","DOI":"10.1109\/CVPR42600.2020.00753"},{"key":"1977_CR232","unstructured":"Yu F, Koltun V (2016) Multi-Scale Context Aggregation by Dilated Convolutions. In: Int. Conf. Learn. Represent."},{"key":"1977_CR233","doi-asserted-by":"crossref","unstructured":"Yu J, Lin Z, Yang J, Shen X, Lu X, Huang TS (2018) Generative image inpainting with contextual attention. In: IEEE Conf. Comput. Vis. 
Pattern Recog., pp 5505\u20135514","DOI":"10.1109\/CVPR.2018.00577"},{"key":"1977_CR234","doi-asserted-by":"crossref","unstructured":"Yu J, Lin Z, Yang J, Shen X, Lu X, Huang TS (2019) Free-form image inpainting with gated convolution. In: Int. Conf. Comput. Vis., pp 4471\u20134480","DOI":"10.1109\/ICCV.2019.00457"},{"key":"1977_CR235","doi-asserted-by":"crossref","unstructured":"Yu T, Guo Z, Jin X, Wu S, Chen Z, Li W, Zhang Z, Liu S (2020) Region Normalization for Image Inpainting. In: AAAI Conf. Artificial Intell., pp 12733\u201312740","DOI":"10.1609\/aaai.v34i07.6967"},{"key":"1977_CR236","doi-asserted-by":"crossref","unstructured":"Yu Y, Zhan F, Lu S, Pan J, Ma F, Xie X, Miao C (2021a) WaveFill: A Wavelet-Based Generation Network for Image Inpainting. In: Int. Conf. Comput. Vis., pp 14114\u201314123","DOI":"10.1109\/ICCV48922.2021.01385"},{"key":"1977_CR237","doi-asserted-by":"crossref","unstructured":"Yu Y, Zhan F, WU R, Pan J, Cui K, Lu S, Ma F, Xie X, Miao C (2021b) Diverse Image Inpainting with Bidirectional and Autoregressive Transformers. In: ACM Int. Conf. Multimedia, p 69-78","DOI":"10.1145\/3474085.3475436"},{"key":"1977_CR238","doi-asserted-by":"crossref","unstructured":"Yu Y, Du D, Zhang L, Luo T (2022a) Unbiased Multi-modality Guidance for Image Inpainting. In: Eur. Conf. Comput. Vis., pp 668\u2013684","DOI":"10.1007\/978-3-031-19787-1_38"},{"key":"1977_CR239","doi-asserted-by":"crossref","unstructured":"Yu Y, Zhang L, Fan H, Luo T (2022b) High-Fidelity Image Inpainting with GAN Inversion. In: Eur. Conf. Comput. Vis., pp 242\u2013258","DOI":"10.1007\/978-3-031-19787-1_14"},{"key":"1977_CR240","doi-asserted-by":"crossref","unstructured":"Zeng Y, Fu J, Chao H, Guo B (2019) Learning pyramid-context encoder network for high-quality image inpainting. In: IEEE Conf. Comput. Vis. Pattern Recog., pp 1486\u20131494","DOI":"10.1109\/CVPR.2019.00158"},{"key":"1977_CR241","doi-asserted-by":"crossref","unstructured":"Zeng, Y., Fu, J., & Chao, H. (2020). 
Learning Joint Spatial-Temporal Transformations for Video Inpainting. In Eur. Conf. Comput. Vis. (pp. 528\u2013543). Springer.","DOI":"10.1007\/978-3-030-58517-4_31"},{"key":"1977_CR242","doi-asserted-by":"crossref","unstructured":"Zeng Y, Lin Z, Yang J, Zhang J, Shechtman E, Lu H (2020b) High-Resolution Image Inpainting with Iterative Confidence Feedback and Guided Upsampling. In: Eur. Conf. Comput. Vis.","DOI":"10.1007\/978-3-030-58529-7_1"},{"key":"1977_CR243","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2021.108036","volume":"119","author":"Y Zeng","year":"2021","unstructured":"Zeng, Y., Gong, Y., & Zhang, J. (2021). Feature learning and patch matching for diverse image inpainting. Pattern Recog, 119, 108036.","journal-title":"Pattern Recog"},{"key":"1977_CR244","doi-asserted-by":"crossref","unstructured":"Zeng Y, Lin Z, Lu H, Patel VM (2021b) CR-Fill: Generative Image Inpainting With Auxiliary Contextual Reconstruction. In: Int. Conf. Comput. Vis., pp 14164\u201314173","DOI":"10.1109\/ICCV48922.2021.01390"},{"key":"1977_CR245","unstructured":"Zeng Y, Fu J, Chao H, Guo B (2022) Aggregated contextual transformations for high-resolution image inpainting. IEEE Trans Vis Comput Graph pp 1\u20131"},{"issue":"2","key":"1977_CR246","doi-asserted-by":"publisher","first-page":"533","DOI":"10.1109\/TIP.2009.2035882","volume":"19","author":"B Zhang","year":"2010","unstructured":"Zhang, B., Gao, Y., Zhao, S., & Liu, J. (2010). Local derivative pattern versus local binary pattern: Face recognition with high-order local pattern descriptor. IEEE Trans Image Process, 19(2), 533\u2013544.","journal-title":"IEEE Transactions on Image Processing"},{"key":"1977_CR247","doi-asserted-by":"crossref","unstructured":"Zhang H, Hu Z, Luo C, Zuo W, Wang M (2018a) Semantic Image Inpainting with Progressive Generative Networks. In: ACM Int. Conf. 
Multimedia, p 1939-1947","DOI":"10.1145\/3240508.3240625"},{"key":"1977_CR248","doi-asserted-by":"crossref","unstructured":"Zhang H, Mai L, Xu N, Wang Z, Collomosse J, Jin H (2019a) An internal learning approach to video inpainting. In: Int. Conf. Comput. Vis., pp 2720\u20132729","DOI":"10.1109\/ICCV.2019.00281"},{"key":"1977_CR249","doi-asserted-by":"crossref","unstructured":"Zhang J, Niu L, Yang D, Kang L, Li Y, Zhao W, Zhang L (2019b) GAIN: Gradient Augmented Inpainting Network for Irregular Holes. In: ACM Int. Conf. Multimedia, p 1870-1878","DOI":"10.1145\/3343031.3350912"},{"key":"1977_CR250","doi-asserted-by":"crossref","unstructured":"Zhang K, Fu J, Liu D (2022a) Flow-Guided Transformer for Video Inpainting. In: Eur. Conf. Comput. Vis., pp 74\u201390","DOI":"10.1007\/978-3-031-19797-0_5"},{"key":"1977_CR251","doi-asserted-by":"crossref","unstructured":"Zhang K, Fu J, Liu D (2022b) Inertia-Guided Flow Completion and Style Fusion for Video Inpainting. In: IEEE Conf. Comput. Vis. Pattern Recog., pp 5982\u20135991","DOI":"10.1109\/CVPR52688.2022.00589"},{"key":"1977_CR252","doi-asserted-by":"crossref","unstructured":"Zhang L, Agrawala M (2023) Adding conditional control to text-to-image diffusion models. arxiv:2302.05543","DOI":"10.1109\/ICCV51070.2023.00355"},{"key":"1977_CR253","doi-asserted-by":"crossref","unstructured":"Zhang L, Chen Q, Hu B, Jiang S (2020a) Text-Guided Neural Image Inpainting. In: ACM Int. Conf. Multimedia, p 1302-1310","DOI":"10.1145\/3394171.3414017"},{"key":"1977_CR254","doi-asserted-by":"crossref","unstructured":"Zhang L, Barnes C, Wampler K, Amirghodsi S, Shechtman E, Lin Z, Shi J (2022c) Inpainting at Modern Camera Resolution by Guided PatchMatch with Auto-curation. In: Eur. Conf. Comput. Vis., pp 51\u201367","DOI":"10.1007\/978-3-031-19790-1_4"},{"key":"1977_CR255","first-page":"146","volume":"2022","author":"L Zhang","year":"2022","unstructured":"Zhang, L., Zhou, Y., Barnes, C., Amirghodsi, S., Lin, Z., Shechtman, E., & Shi, J. 
(2022). Perceptual Artifacts Localization for Inpainting. Computer Vision - ECCV, 2022, 146\u2013164.","journal-title":"Computer Vision - ECCV"},{"key":"1977_CR256","doi-asserted-by":"crossref","unstructured":"Zhang R, Isola P, Efros AA, Shechtman E, Wang O (2018b) The Unreasonable Effectiveness of Deep Features as a Perceptual Metric. In: IEEE Conf. Comput. Vis. Pattern Recog., pp 586\u2013595","DOI":"10.1109\/CVPR.2018.00068"},{"key":"1977_CR257","doi-asserted-by":"crossref","unstructured":"Zhang R, Quan W, Wu B, Li Z, Yan DM (2020b) Pixel-wise dense detector for image inpainting. Comput Graph Forum 39(7)","DOI":"10.1111\/cgf.14160"},{"key":"1977_CR258","unstructured":"Zhang R, Quan W, Zhang Y, Wang J, Yan DM (2022e) W-net: Structure and texture interaction for image inpainting. IEEE Trans Multimedia pp 1\u201312"},{"issue":"3","key":"1977_CR259","doi-asserted-by":"publisher","first-page":"637","DOI":"10.1109\/TIFS.2017.2763119","volume":"13","author":"S Zhang","year":"2018","unstructured":"Zhang, S., He, R., Sun, Z., & Tan, T. (2018). Demeshnet: Blind face inpainting for deep meshface verification. IEEE Trans Inf Forensics Secur, 13(3), 637\u2013647.","journal-title":"IEEE Transactions on Information Forensics and Security"},{"key":"1977_CR260","doi-asserted-by":"crossref","unstructured":"Zhang W, Zhu J, Tai Y, Wang Y, Chu W, Ni B, Wang C, Yang X (2021) Context-Aware Image Inpainting with Learned Semantic Priors. In: Int. Joint Conf. Artificial Intell., pp 1323\u20131329","DOI":"10.24963\/ijcai.2021\/183"},{"key":"1977_CR261","doi-asserted-by":"crossref","unstructured":"Zhang Z, Zhao Z, Zhang Z, Huai B, Yuan J (2020c) Text-guided image inpainting. In: ACM Int. Conf. Multimedia, pp 4079\u20134087","DOI":"10.1145\/3394171.3413939"},{"key":"1977_CR262","doi-asserted-by":"crossref","unstructured":"Zhao L, Mo Q, Lin S, Wang Z, Zuo Z, Chen H, Xing W, Lu D (2020) UCTGAN: Diverse Image Inpainting Based on Unsupervised Cross-Space Translation. In: IEEE Conf. Comput. Vis. 
Pattern Recog., pp 5740\u20135749","DOI":"10.1109\/CVPR42600.2020.00578"},{"key":"1977_CR263","unstructured":"Zhao S, Cui J, Sheng Y, Dong Y, Liang X, Chang EI, Xu Y (2021) Large Scale Image Completion via Co-Modulated Generative Adversarial Networks. In: Int. Conf. Learn. Represent."},{"key":"1977_CR264","doi-asserted-by":"crossref","unstructured":"Zhao W, Rao Y, Liu Z, Liu B, Zhou J, Lu J (2023) Unleashing text-to-image diffusion models for visual perception. arXiv preprint arXiv:2303.02153","DOI":"10.1109\/ICCV51070.2023.00527"},{"key":"1977_CR265","doi-asserted-by":"crossref","unstructured":"Zheng C, Cham TJ, Cai J (2019) Pluralistic Image Completion. In: IEEE Conf. Comput. Vis. Pattern Recog., pp 1438\u20131447","DOI":"10.1109\/CVPR.2019.00153"},{"key":"1977_CR266","doi-asserted-by":"publisher","first-page":"2786","DOI":"10.1007\/s11263-021-01502-7","volume":"129","author":"C Zheng","year":"2021","unstructured":"Zheng, C., Cham, T. J., & Cai, J. (2021). Pluralistic free-form image completion. Int J Comput Vis, 129, 2786\u20132805.","journal-title":"International Journal of Computer Vision"},{"key":"1977_CR267","doi-asserted-by":"crossref","unstructured":"Zheng C, Cham TJ, Cai J, Phung D (2022a) Bridging Global Context Interactions for High-Fidelity Image Completion. In: IEEE Conf. Comput. Vis. Pattern Recog., pp 11512\u201311522","DOI":"10.1109\/CVPR52688.2022.01122"},{"key":"1977_CR268","doi-asserted-by":"crossref","unstructured":"Zheng H, Zhang Z, Wang Y, Zhang Z, Xu M, Yang Y, Wang M (2021b) GCM-Net: Towards Effective Global Context Modeling for Image Inpainting. In: ACM Int. Conf. Multimedia, p 2586\u20132594","DOI":"10.1145\/3474085.3475433"},{"key":"1977_CR269","doi-asserted-by":"crossref","unstructured":"Zheng H, Lin Z, Lu J, Cohen S, Shechtman E, Barnes C, Zhang J, Xu N, Amirghodsi S, Luo J (2022b) Image Inpainting with Cascaded Modulation GAN and Object-Aware Training. In: Eur. Conf. Comput. 
Vis., pp 277\u2013296","DOI":"10.1007\/978-3-031-19787-1_16"},{"issue":"6","key":"1977_CR270","doi-asserted-by":"publisher","first-page":"1452","DOI":"10.1109\/TPAMI.2017.2723009","volume":"40","author":"B Zhou","year":"2017","unstructured":"Zhou, B., Lapedriza, A., Khosla, A., Oliva, A., & Torralba, A. (2017). Places: A 10 million image database for scene recognition. IEEE Trans Pattern Anal Mach Intell, 40(6), 1452\u20131464.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1977_CR271","doi-asserted-by":"publisher","first-page":"302","DOI":"10.1007\/s11263-018-1140-0","volume":"127","author":"B Zhou","year":"2018","unstructured":"Zhou, B., Zhao, H., Puig, X., Xiao, T., Fidler, S., Barriuso, A., & Torralba, A. (2018). Semantic understanding of scenes through the ade20k dataset. Int J Comput Vis, 127, 302\u2013321.","journal-title":"International Journal of Computer Vision"},{"key":"1977_CR272","doi-asserted-by":"crossref","unstructured":"Zhou X, Li J, Wang Z, He R, Tan T (2021) Image Inpainting with Contrastive Relation Network. In: Int. Conf. Pattern Recog., pp 4420\u20134427","DOI":"10.1109\/ICPR48806.2021.9412640"},{"key":"1977_CR273","doi-asserted-by":"publisher","first-page":"4855","DOI":"10.1109\/TIP.2021.3076310","volume":"30","author":"M Zhu","year":"2021","unstructured":"Zhu, M., He, D., Li, X., Li, C., Li, F., Liu, X., Ding, E., & Zhang, Z. (2021). Image inpainting by end-to-end cascaded refinement with mask awareness. IEEE Trans Image Process, 30, 4855\u20134866.","journal-title":"IEEE Transactions on Image Processing"},{"key":"1977_CR274","doi-asserted-by":"crossref","unstructured":"Zou X, Yang L, Liu D, Lee YJ (2021) Progressive temporal feature alignment network for video inpainting. In: IEEE Conf. Comput. Vis. 
Pattern Recog., pp 16448\u201316457","DOI":"10.1109\/CVPR46437.2021.01618"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-023-01977-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-023-01977-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-023-01977-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,8]],"date-time":"2024-11-08T16:19:27Z","timestamp":1731082767000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-023-01977-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,1,19]]},"references-count":274,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2024,7]]}},"alternative-id":["1977"],"URL":"https:\/\/doi.org\/10.1007\/s11263-023-01977-6","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,1,19]]},"assertion":[{"value":"15 March 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 December 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 January 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}