{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,14]],"date-time":"2026-05-14T23:23:18Z","timestamp":1778800998067,"version":"3.51.4"},"reference-count":54,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Key-Area Research Development Program of Guangdong Province","award":["2019B121204008"],"award-info":[{"award-number":["2019B121204008"]}]},{"name":"Shenzhen Municipal Science and Technology Program","award":["JCYJ20170818141146428"],"award-info":[{"award-number":["JCYJ20170818141146428"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. 
on Image Process."],"published-print":{"date-parts":[[2020]]},"DOI":"10.1109\/tip.2020.3018224","type":"journal-article","created":{"date-parts":[[2020,8,27]],"date-time":"2020-08-27T23:00:32Z","timestamp":1598569232000},"page":"8622-8635","source":"Crossref","is-referenced-by-count":71,"title":["Deep Spatial Transformation for Pose-Guided Person Image Generation and Animation"],"prefix":"10.1109","volume":"29","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0178-4460","authenticated-orcid":false,"given":"Yurui","family":"Ren","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0140-0949","authenticated-orcid":false,"given":"Ge","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shan","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Thomas H.","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00524"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00519"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1111\/cgf.13632"},{"key":"ref32","article-title":"Everybody dance now","author":"chan","year":"2018","journal-title":"arXiv 1808 07371"},{"key":"ref31","article-title":"Video-to-video synthesis","author":"wang","year":"2018","journal-title":"arXiv 1808 06601"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00381"},{"key":"ref37","article-title":"Generating long sequences with sparse transformers","author":"child","year":"2019","journal-title":"arXiv 1904 10509"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01454"},{"key":"ref35","article-title":"Large scale GAN training for high fidelity natural image 
synthesis","author":"brock","year":"2018","journal-title":"arXiv 1809 11096"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00762"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00923"},{"key":"ref27","article-title":"CrowdPose: Efficient crowded scenes pose estimation and a new benchmark","author":"li","year":"2018","journal-title":"arXiv 1812 00324"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.01057"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00359"},{"key":"ref1","first-page":"406","article-title":"Pose guided person image generation","author":"ma","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00308"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46493-0_18"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00027"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.291"},{"key":"ref23","article-title":"FlowNet: Learning optical flow with convolutional networks","author":"fischer","year":"2015","journal-title":"arXiv 1504 06852"},{"key":"ref26","article-title":"OpenPose: Realtime multi-person 2D pose estimation using part affinity fields","author":"cao","year":"2018","journal-title":"arXiv 1812 08008"},{"key":"ref25","article-title":"DwNet: Dense warp-based network for pose-guided human video generation","author":"zablotskaia","year":"2019","journal-title":"arXiv 1910 09139"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.502"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.133"},{"key":"ref54","article-title":"FaceForensics: A large-scale video dataset for forgery detection in human faces","author":"r\u00f6ssler","year":"2018","journal-title":"arXiv 1803 09179"},{"key":"ref53","article-title":"ShapeNet: An information-rich 3D model 
repository","author":"chang","year":"2015","journal-title":"arXiv 1512 03012"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.124"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.143"},{"key":"ref12","first-page":"568","article-title":"Two-stream convolutional networks for action recognition in videos","author":"simonyan","year":"2014","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref13","first-page":"2017","article-title":"Spatial transformer networks","author":"jaderberg","year":"2015","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref14","first-page":"5998","article-title":"Attention is all you need","author":"vaswani","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref15","article-title":"Self-attention generative adversarial networks","author":"zhang","year":"2018","journal-title":"arXiv 1805 08318"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00813"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00356"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00577"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00771"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00245"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00246"},{"key":"ref6","first-page":"7137","article-title":"First order motion model for image animation","author":"siarohin","year":"2019","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref5","article-title":"Few-shot video-to-video synthesis","author":"wang","year":"2019","journal-title":"arXiv 1910 
12713"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00600"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00248"},{"key":"ref49","first-page":"6626","article-title":"GANs trained by a two time-scale update rule converge to a local NASH equilibrium","author":"heusel","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref9","author":"goodfellow","year":"2016","journal-title":"Deep Learning"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.248"},{"key":"ref45","article-title":"Layer normalization","author":"ba","year":"2016","journal-title":"arXiv 1607 06450"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00068"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref42","first-page":"694","article-title":"Perceptual losses for real-time style transfer and super-resolution","author":"johnson","year":"2016","journal-title":"Proc Eur Conf Comput Vis"},{"key":"ref41","first-page":"2672","article-title":"Generative adversarial nets","author":"goodfellow","year":"2014","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.167"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00794"}],"container-title":["IEEE Transactions on Image 
Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/83\/8835130\/09178983.pdf?arnumber=9178983","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,4,27]],"date-time":"2022-04-27T14:38:48Z","timestamp":1651070328000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9178983\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"references-count":54,"URL":"https:\/\/doi.org\/10.1109\/tip.2020.3018224","relation":{},"ISSN":["1057-7149","1941-0042"],"issn-type":[{"value":"1057-7149","type":"print"},{"value":"1941-0042","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020]]}}}