{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2023,3,22]],"date-time":"2023-03-22T04:34:36Z","timestamp":1679459676015},"reference-count":37,"publisher":"Springer Science and Business Media LLC","issue":"9","license":[{"start":{"date-parts":[[2022,9,26]],"date-time":"2022-09-26T00:00:00Z","timestamp":1664150400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,9,26]],"date-time":"2022-09-26T00:00:00Z","timestamp":1664150400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2023,4]]},"DOI":"10.1007\/s11042-022-13899-5","type":"journal-article","created":{"date-parts":[[2022,9,26]],"date-time":"2022-09-26T10:03:08Z","timestamp":1664186588000},"page":"13579-13594","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Human face generation from textual description via style mapping and manipulation"],"prefix":"10.1007","volume":"82","author":[{"given":"Shantanu","family":"Todmal","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ashish","family":"Mule","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Devang","family":"Bhagwat","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tanmoy","family":"Hazra","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bhupendra","family":"Singh","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,9,26]]},"reference":[{"key":"13899_CR1","doi-asserted-by":"crossref","unstructured":"Abdal YQR Wonka P (2019) \u201cIm- age2StyleGAN: how to embed images into the style- GAN latent space?\u201d In: ICCV.","DOI":"10.1109\/ICCV.2019.00453"},{"key":"13899_CR2","unstructured":"Barratt S, Sharma R (2018) \u201cA note on the inception score\u201d. In: arXiv preprint arXiv:1801.01973"},{"key":"13899_CR3","doi-asserted-by":"crossref","unstructured":"Bau D et al. (2019) \u201cSeeing what a Gan cannot generate\u201d. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision. pp. 4502\u20134511.","DOI":"10.1109\/ICCV.2019.00460"},{"key":"13899_CR4","unstructured":"Chen X et al. (2019) \u201cFTGAN: a fully-trained generative adversarial networks for text to face generation\u201d. In: arXiv preprint arXiv:1904.05729."},{"key":"13899_CR5","doi-asserted-by":"crossref","unstructured":"Garg K et al. (2020) \u201cPerception GAN: real-world image construction from provided text through perceptual understanding\u201d. In: 2020 Joint 9th International Conference on Informatics, Electronics & Vision (ICIEV) and 2020 4th International Conference on Imaging, Vision & Pattern Recognition (icIVPR). IEEE ,pp. 1\u20137.","DOI":"10.1109\/ICIEVicIVPR48672.2020.9306618"},{"key":"13899_CR6","unstructured":"Goodfellow IJ et al. (2014) \u201cGenerative adversarial net- works\u201d. In: arXiv preprint arXiv:1406.2661."},{"key":"13899_CR7","unstructured":"Heusel M et al. (2017) \u201cGans trained by a two time-scale update rule converge to a local Nash equilibrium\u201d. In: arXiv preprint arXiv:1706.08500."},{"key":"13899_CR8","doi-asserted-by":"crossref","unstructured":"Karnewar A and Wang O (2020) \u201cMsg-Gan: multi- scale gradients for generative adversarial networks\u201d. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7799\u20137808.","DOI":"10.1109\/CVPR42600.2020.00782"},{"key":"13899_CR9","unstructured":"Karras T et al. (2017) \u201cProgressive growing of gans for improved quality, stability, and variation\u201d. In: arXiv preprint arXiv:1710.10196."},{"key":"13899_CR10","doi-asserted-by":"crossref","unstructured":"Karras T, S Laine, Aila T (2019) \u201cA style- based generator architecture for generative adversarial networks\u201d. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4401\u20134410.","DOI":"10.1109\/CVPR.2019.00453"},{"key":"13899_CR11","doi-asserted-by":"crossref","unstructured":"Karras T et al. (2020) \u201cAnalyzing and improving the image quality of StyleGAN\u201d. In: Proc CVPR.","DOI":"10.1109\/CVPR42600.2020.00813"},{"key":"13899_CR12","unstructured":"Kettunen M, H\u00e4rk\u00f6nen E, Lehtinen J (2019). \u201cE-LPIPS: robust perceptual image similarity via random transformation ensembles\u201d. In: arXiv preprint arXiv:1906.03973"},{"key":"13899_CR13","doi-asserted-by":"publisher","unstructured":"Khan M et al. (2020) \u201cA Realistic Image Generation of Face From Text Description Using the Fully Trained Generative Adversarial Networks\u201d. In: IEEE Access PP, pp. 1\u20131. https:\/\/doi.org\/10.1109\/ACCESS.2020.3015656.","DOI":"10.1109\/ACCESS.2020.3015656"},{"key":"13899_CR14","first-page":"1097","volume":"25","author":"A Krizhevsky","year":"2012","unstructured":"Krizhevsky A, Sutskever I, Hinton GE (2012) Imagenet classification with deep convolutional neural networks. Adv Neural Inf Proces Syst 25:1097\u20131105","journal-title":"Adv Neural Inf Proces Syst"},{"key":"13899_CR15","doi-asserted-by":"crossref","unstructured":"Lee C-H et al. (2020) \u201cMaskGAN: towards diverse and interactive facial image manipulation\u201d. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR).","DOI":"10.1109\/CVPR42600.2020.00559"},{"key":"13899_CR16","unstructured":"Li B et al. (2019) \u201cControllable text-to-image generation\u201d. In: arXiv preprint arXiv:1909.07083."},{"key":"13899_CR17","unstructured":"Mao J et al. (2015) \u201cDeep captioning with multi- modal recurrent neural networks (m-RNN)\u201d. In: ICLR."},{"key":"13899_CR18","doi-asserted-by":"crossref","unstructured":"Nasir OR et al (2019) \u201cText2FaceGAN: face generation from fine grained textual descriptions\u201d. In: 2019 IEEE Fifth International Conference on Multime- dia Big Data (BigMM). IEEE, pp. 58\u201367.","DOI":"10.1109\/BigMM.2019.00-42"},{"key":"13899_CR19","doi-asserted-by":"crossref","unstructured":"Patashnik O et al. (2021) \u201cStyleclip: text-driven manipulation of stylegan imagery\u201d. In: arXiv preprint arXiv:2103.17249","DOI":"10.1109\/ICCV48922.2021.00209"},{"key":"13899_CR20","unstructured":"Radford A, Metz L, Chintala S (2015) \u201cUnsupervised representation learning with deep convolutional generative adversarial networks\u201d. In: arXiv preprint arXiv:1511.06434."},{"key":"13899_CR21","unstructured":"Radford A et al. (2021) \u201cLearning Transferable Visual Models From Natural Language Supervision\u201d. In: arXiv preprint arXiv:2103.00020."},{"key":"13899_CR22","unstructured":"Reed S et al. (2016) \u201cGenerative adversarial text to image synthesis\u201d. In: International Conference on Machine Learning. PMLR, pp. 1060\u20131069."},{"key":"13899_CR23","doi-asserted-by":"crossref","unstructured":"Richardson E et al. (2020) \u201cEncoding in style: a StyleGAN encoder for image-to-image translation\u201d. In: arXiv preprint arXiv:2008.00951.","DOI":"10.1109\/CVPR46437.2021.00232"},{"key":"13899_CR24","unstructured":"Salimans T et al. (2016) \u201cImproved techniques for training gans\u201d. In: arXiv preprint arXiv:1606.03498"},{"key":"13899_CR25","doi-asserted-by":"crossref","unstructured":"Shen Y et al. (2020) \u201cInterpreting the latent space of gans for semantic face editing\u201d. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9243\u20139252.","DOI":"10.1109\/CVPR42600.2020.00926"},{"key":"13899_CR26","unstructured":"Simonyan K, Zisserman A (2014) \u201cVery deep convolutional networks for large-scale image recognition\u201d. In: arXiv preprint arXiv:1409.1556."},{"key":"13899_CR27","doi-asserted-by":"crossref","unstructured":"Szegedy C et al. (2016) \u201cRethinking the inception architecture for computer vision\u201d. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 2818\u20132826.","DOI":"10.1109\/CVPR.2016.308"},{"key":"13899_CR28","unstructured":"Tao X et al. 2018 \u201cAttngan: fine-grained text to im- age generation with attentional generative adversarial networks\u201d. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 1316\u20131324."},{"key":"13899_CR29","unstructured":"Tao M et al. (2020) \u201cDf-Gan: deep fusion generative adversarial networks for text-to-image synthesis\u201d. In: arXiv preprint arXiv:2008.05865."},{"key":"13899_CR30","doi-asserted-by":"crossref","unstructured":"Wang T, Zhang T, and Lovell B (2021) \u201cFaces a la carte: text-to-face generation via attribute disentanglement\u201d. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 3380\u20133388.","DOI":"10.1109\/WACV48630.2021.00342"},{"key":"13899_CR31","unstructured":"Xia W et al. (2021) \u201cGAN Inversion: A Survey\u201d. In: arXiv preprint arXiv:2101.05278."},{"key":"13899_CR32","doi-asserted-by":"crossref","unstructured":"Xia W et al. (2021) \u201cTediGAN: text-guided diverse face image generation and manipulation\u201d. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","DOI":"10.1109\/CVPR46437.2021.00229"},{"issue":"9","key":"13899_CR33","doi-asserted-by":"publisher","first-page":"2251","DOI":"10.1109\/TPAMI.2018.2857768","volume":"41","author":"Y Xian","year":"2018","unstructured":"Xian Y et al (2018) Zero-shot learning\u2014a comprehensive evaluation of the good, the bad and the ugly. IEEE Trans Pattern Anal Mach Intell 41(9):2251\u20132265","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"13899_CR34","unstructured":"Yongyi L, Tai Y-W, Tang C-K(2018) \u201cAttribute-guided face generation using conditional cyclegan\u201d. In: Proceedings of the European conference on computer vision (ECCV), pp. 282\u2013297."},{"issue":"8","key":"13899_CR35","doi-asserted-by":"publisher","first-page":"1947","DOI":"10.1109\/TPAMI.2018.2856256","volume":"41","author":"H Zhang","year":"2018","unstructured":"Zhang H et al (2018) Stackgan++: realistic image syn- thesis with stacked generative adversarial networks. IEEE Trans Pattern Anal Mach Intell 41(8):1947\u20131962","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"13899_CR36","doi-asserted-by":"crossref","unstructured":"Zhang R et al. (2018) \u201cThe unreasonable effectiveness of deep features as a perceptual metric\u201d. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 586\u2013595.","DOI":"10.1109\/CVPR.2018.00068"},{"key":"13899_CR37","doi-asserted-by":"crossref","unstructured":"Zhu M et al. (2019) \u201cDm-Gan: dynamic memory generative adversarial networks for text-to-image synthesis\u201d. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5802\u20135810.","DOI":"10.1109\/CVPR.2019.00595"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-13899-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-022-13899-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-13899-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,3,21]],"date-time":"2023-03-21T10:32:56Z","timestamp":1679394776000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-022-13899-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,9,26]]},"references-count":37,"journal-issue":{"issue":"9","published-print":{"date-parts":[[2023,4]]}},"alternative-id":["13899"],"URL":"https:\/\/doi.org\/10.1007\/s11042-022-13899-5","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,9,26]]},"assertion":[{"value":"24 June 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 June 2022","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 September 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 September 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declaration"}},{"value":"We declare that there is no conflict of interest for this research submission.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}