{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,9]],"date-time":"2026-06-09T06:51:25Z","timestamp":1780987885131,"version":"3.54.1"},"reference-count":42,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"12","license":[{"start":{"date-parts":[[2020,12,1]],"date-time":"2020-12-01T00:00:00Z","timestamp":1606780800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,12,1]],"date-time":"2020-12-01T00:00:00Z","timestamp":1606780800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,12,1]],"date-time":"2020-12-01T00:00:00Z","timestamp":1606780800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"National Key R&D Program of China","award":["2019YFF0303300"],"award-info":[{"award-number":["2019YFF0303300"]}]},{"name":"Subject II","award":["2019YFF0303302"],"award-info":[{"award-number":["2019YFF0303302"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61802026"],"award-info":[{"award-number":["61802026"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61906018"],"award-info":[{"award-number":["61906018"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Science and Technology Program of the Headquarters of State Grid Corporation of China","award":["5200-201918255A-0-0-00"],"award-info":[{"award-number":["5200-201918255A-0-0-00"]}]},{"DOI":"10.13039\/501100013314","name":"Higher Education Discipline Innovation 
Project","doi-asserted-by":"publisher","award":["B08004"],"award-info":[{"award-number":["B08004"]}],"id":[{"id":"10.13039\/501100013314","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Multimedia"],"published-print":{"date-parts":[[2020,12]]},"DOI":"10.1109\/tmm.2020.2972856","type":"journal-article","created":{"date-parts":[[2020,2,11]],"date-time":"2020-02-11T02:02:42Z","timestamp":1581386562000},"page":"3075-3087","source":"Crossref","is-referenced-by-count":44,"title":["Exploring Global and Local Linguistic Representations for Text-to-Image Synthesis"],"prefix":"10.1109","volume":"22","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3543-6272","authenticated-orcid":false,"given":"Ruifan","family":"Li","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6423-3167","authenticated-orcid":false,"given":"Ning","family":"Wang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4798-4233","authenticated-orcid":false,"given":"Fangxiang","family":"Feng","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Guangwei","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6423-3167","authenticated-orcid":false,"given":"Xiaojie","family":"Wang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref39","first-page":"740","article-title":"Microsoft COCO: Common objects in context","author":"lin","year":"0","journal-title":"Proc Eur Conf Comput Vision"},{"key":"ref38","article-title":"The caltech-UCSD birds-200-2011 
dataset","author":"wah","year":"2011"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2908352"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2898777"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00133"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00833"},{"key":"ref37","article-title":"Geometric GAN","author":"lim","year":"2017"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref35","first-page":"6594","article-title":"Modulating early visual processing by language","author":"vries","year":"0","journal-title":"Proc Advances Neural Inf Process Syst"},{"key":"ref34","article-title":"Large scale GAN training for high fidelity natural image synthesis","author":"brock","year":"2019","journal-title":"Proc Int Conf Learn Representations"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3077136.3080842"},{"key":"ref40","first-page":"2234","article-title":"Improved techniques for training GANs","author":"salimans","year":"0","journal-title":"Proc Advances Neural Inf Process Syst"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2911456"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2912714"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2018\/592"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2915033"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2017.2751140"},{"key":"ref16","first-page":"2672","article-title":"Generative adversarial nets","author":"goodfellow","year":"0","journal-title":"Proc Advances Neural Inf Process Syst"},{"key":"ref17","article-title":"Conditional generative adversarial nets","author":"mirza","year":"2014"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/78.650093"},{"key":"ref19","article-title":"Towards principled methods for training generative adversarial 
networks","author":"arjovsky","year":"0","journal-title":"Proc Int Conf Learn Representations"},{"key":"ref28","first-page":"5767","article-title":"Improved training of Wasserstein GANs","author":"gulrajani","year":"2017","journal-title":"Proc Advances Neural Inf Process Syst"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2856256"},{"key":"ref27","article-title":"Wasserstein GAN","author":"arjovsky","year":"2017"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.629"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00143"},{"key":"ref29","article-title":"Spectral normalization for generative adversarial networks","author":"miyato","year":"0","journal-title":"Proc Int Conf Learn Representations"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00649"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01245"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00160"},{"key":"ref2","first-page":"217","article-title":"Learning what and where to draw","author":"reed","year":"0","journal-title":"Proc Advances Neural Inf Process Syst"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2014.12.020"},{"key":"ref1","first-page":"1060","article-title":"Generative adversarial text to image synthesis","author":"reed","year":"0","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref20","article-title":"Unsupervised representation learning with deep convolutional generative adversarial networks","author":"radford","year":"0","journal-title":"Proc Int Conf Learn Representations"},{"key":"ref22","article-title":"Energy-based generative adversarial networks","author":"zhao","year":"0","journal-title":"Proc Int Conf Learn Representations"},{"key":"ref21","first-page":"1486","article-title":"Deep generative image models using a Laplacian pyramid of adversarial networks","author":"denton","year":"2015","journal-title":"Proc Advances 
Neural Inf Process Syst"},{"key":"ref42","article-title":"Adam: A method for stochastic optimization","author":"kingma","year":"0","journal-title":"Proc Int Conf Learn Representations"},{"key":"ref24","first-page":"2642","article-title":"Conditional image synthesis with auxiliary classifier GANs","author":"odena","year":"0","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref41","first-page":"6626","article-title":"GANs trained by a two time-scale update rule converge to a nash equilibrium","author":"heusel","year":"0","journal-title":"Proc Advances Neural Inf Process Syst"},{"key":"ref23","article-title":"BEGAN: Boundary equilibrium generative adversarial networks","author":"berthelot","year":"2017"},{"key":"ref26","article-title":"cGANs with projection discriminator","author":"miyato","year":"0","journal-title":"Proc Int Conf Learn Representations"},{"key":"ref25","first-page":"394","article-title":"Binary generative adversarial networks for image retrieval","author":"song","year":"0","journal-title":"Proc 32nd AAAI Conf Artif Intell"}],"container-title":["IEEE Transactions on Multimedia"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6046\/9263048\/08989803.pdf?arnumber=8989803","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,4,27]],"date-time":"2022-04-27T15:57:39Z","timestamp":1651075059000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8989803\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,12]]},"references-count":42,"journal-issue":{"issue":"12"},"URL":"https:\/\/doi.org\/10.1109\/tmm.2020.2972856","relation":{},"ISSN":["1520-9210","1941-0077"],"issn-type":[{"value":"1520-9210","type":"print"},{"value":"1941-0077","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,12]]}}}