{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,20]],"date-time":"2025-11-20T19:03:04Z","timestamp":1763665384694,"version":"3.37.3"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"12","license":[{"start":{"date-parts":[[2024,2,9]],"date-time":"2024-02-09T00:00:00Z","timestamp":1707436800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,2,9]],"date-time":"2024-02-09T00:00:00Z","timestamp":1707436800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"Nation Natural Science Foundation of China","doi-asserted-by":"crossref","award":["62072150"],"award-info":[{"award-number":["62072150"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Shaanxi Provincial Key Research and Development Program","award":["2023-YBGY-148"],"award-info":[{"award-number":["2023-YBGY-148"]}]},{"name":"Henan Provincial Science and Technology Plan Project","award":["222102210240"],"award-info":[{"award-number":["222102210240"]}]},{"name":"Henan Provincial Higher Education Key Scientific Research Project","award":["22B520012","22A510017"],"award-info":[{"award-number":["22B520012","22A510017"]}]},{"name":"Shaanxi Provincial Social Science Fund Project","award":["2022M007"],"award-info":[{"award-number":["2022M007"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2024,12]]},"DOI":"10.1007\/s00371-024-03260-2","type":"journal-article","created":{"date-parts":[[2024,2,9]],"date-time":"2024-02-09T09:02:32Z","timestamp":1707469352000},"page":"8639-8651","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Masked cross-attention and multi-head channel attention guiding single-stage generative adversarial networks for text-to-image generation"],"prefix":"10.1007","volume":"40","author":[{"given":"Shouming","family":"Hou","sequence":"first","affiliation":[]},{"given":"Ziying","family":"Li","sequence":"additional","affiliation":[]},{"given":"Kuikui","family":"Wu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0007-4278-0868","authenticated-orcid":false,"given":"Yinggang","family":"Zhao","sequence":"additional","affiliation":[]},{"given":"Hui","family":"Li","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,2,9]]},"reference":[{"key":"3260_CR1","first-page":"9459","volume":"33","author":"P Lewis","year":"2020","unstructured":"Lewis, P., Perez, E., Piktus, A., et al.: Retrieval-augmented generation for knowledge-intensive nlp tasks. Adv. Neural. Inf. Process. Syst. 33, 9459\u20139474 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"3260_CR2","first-page":"15316","volume":"34","author":"Y Tang","year":"2021","unstructured":"Tang, Y., Han, K., Xu, C., et al.: Augmented shortcuts for vision transformers. Adv. Neural. Inf. Process. Syst. 34, 15316\u201315327 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"issue":"2","key":"3260_CR3","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3439729","volume":"54","author":"Y Deldjoo","year":"2021","unstructured":"Deldjoo, Y., Noia, T.D., Merra, F.A.: A survey on adversarial recommender systems: from attack\/defense strategies to generative adversarial networks. ACM Comput. Surv. (CSUR) 54(2), 1\u201338 (2021)","journal-title":"ACM Comput. Surv. (CSUR)"},{"issue":"20","key":"3260_CR4","doi-asserted-by":"publisher","first-page":"3860","DOI":"10.3390\/math10203860","volume":"10","author":"H Kim","year":"2022","unstructured":"Kim, H., Kim, J., Yang, H.: A GAN-based face rotation for artistic portraits. Mathematics 10(20), 3860 (2022)","journal-title":"Mathematics"},{"key":"3260_CR5","unstructured":"Ramesh, A., Pavlov, M., Goh, G., et al.: Zero-shot text-to-image generation, international conference on machine learning. PMLR, 8821\u20138831, (2021)"},{"key":"3260_CR6","unstructured":"Ramesh, A., Dhariwal, P., Nichol, A., et al.: Hierarchical text-conditional image generation with CLIP latents. arXiv, 2022(2022-04-12)[2023-03-20]."},{"key":"3260_CR7","first-page":"2672","volume":"204","author":"I Goodfellow","year":"2014","unstructured":"Goodfellow, I., Pouget-Abadie, J., Mirza, M., et al.: Generative adversarial nets. In advances in neural information processing systems 27. Annu. Conf. Neural Info Process. Syst. 204, 2672\u20132680 (2014)","journal-title":"Annu. Conf. Neural Info Process. Syst."},{"key":"3260_CR8","unstructured":"Mirza, M., Osindero, S.: Conditional generative adversarial nets. arXiv preprint arXiv:1411.1784, (2014)"},{"key":"3260_CR9","unstructured":"Zhang, H., Xu, T., Li, H., et al.: StackGAN++: realistic image synthesis with stacked generative adversarial networks. arXiv, 2018(2018-06-27)[2023-03-20]"},{"key":"3260_CR10","doi-asserted-by":"crossref","unstructured":"Tan, H., Yin, B., Wei, K., Liu, X., Li, X.: ALR-GAN: Adaptive Layout Refinement for Text-to-Image Synthesis. IEEE Trans. Multimedia. 25, 8620\u20138631 (2023)","DOI":"10.1109\/TMM.2023.3238554"},{"issue":"6","key":"3260_CR11","doi-asserted-by":"publisher","first-page":"5371","DOI":"10.1007\/s11063-022-10866-x","volume":"54","author":"J Zhu","year":"2022","unstructured":"Zhu, J., Li, Z., Wei, J., et al.: PBGN: phased bidirectional generation network in text-to-image synthesis. Neural. Process. Lett. 54(6), 5371\u20135391 (2022)","journal-title":"Neural. Process. Lett."},{"key":"3260_CR12","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1007\/978-981-16-9012-9_14","volume-title":"Sustainable advanced computing","author":"V Agarwal","year":"2022","unstructured":"Agarwal, V., Sharma, S., Aurelia, S., et al.: Deep learning techniques to improve radio resource management in vehicular communication network. In: Biswas, S.K. (ed.) Sustainable advanced computing, pp. 161\u2013171. Springer, Singapore (2022)"},{"issue":"2","key":"3260_CR13","first-page":"25","volume":"14","author":"V Agarwal","year":"2022","unstructured":"Agarwal, V., Sharma, S.: EMVD: efficient multitype vehicle detection algorithm using deep learning approach in vehicular communication network for radio resource management. Int. J. Image Gr. Sign. Process. 14(2), 25\u201337 (2022)","journal-title":"Int. J. Image Gr. Sign. Process."},{"key":"3260_CR14","unstructured":"Karras, T., Laine, S., Aittala, M., et al.: Analyzing and improving the image quality of stylegan. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition"},{"key":"3260_CR15","doi-asserted-by":"crossref","unstructured":"Wang, Y., Qiu, H., Qin, C.: Conditional deformable image registration with spatially-variant and adaptive regularization. arXiv, 2023(2023-03-19)[2023-03-23]","DOI":"10.1109\/ISBI53787.2023.10230464"},{"key":"3260_CR16","unstructured":"Chen, L., Lu, X., Zhang, J., et al.: Hinet: half instance normalization network for image restoration. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition"},{"key":"3260_CR17","unstructured":"Xu, T., Zhang, P., Huang, Q., et al.: AttnGAN: fine-grained text to image generation with attentional generative adversarial networks[Z\/OL]. arXiv, 2017(2017-11-28)[2023-03-20]."},{"key":"3260_CR18","unstructured":"Zhang, H., Xu, T., Li, H., et al.: Stackgan: text to photo-realistic image synthesis with stacked generative adversarial networks, In: Proceedings of the IEEE international conference on computer vision"},{"key":"3260_CR19","unstructured":"Karras, T., Aila, T., Laine, S., et al.: Progressive growing of GANs for improved quality, stability, and variation. arXiv, 2018 (2018-02-26)[2022-10-09]"},{"issue":"6","key":"3260_CR20","first-page":"3371","volume":"15","author":"V Agarwal","year":"2023","unstructured":"Agarwal, V., Sharma, S.: DQN Algorithm for network resource management in vehicular communication network. Int. J. Inf. Technol. 15(6), 3371\u20133379 (2023)","journal-title":"Int. J. Inf. Technol."},{"key":"3260_CR21","doi-asserted-by":"publisher","first-page":"103267","DOI":"10.1016\/j.dsp.2021.103267","volume":"120","author":"S Huang","year":"2022","unstructured":"Huang, S., Chen, Y.: Generative adversarial networks with adaptive semantic normalization for text-to-image synthesis. Digit. Sign. Process. 120, 103267 (2022)","journal-title":"Digit. Sign. Process."},{"key":"3260_CR22","unstructured":"Liao, W., Hu, K., Yang, M. Y., et al.: Text to image generation with semantic-spatial aware gan. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition"},{"issue":"4","key":"3260_CR23","first-page":"1283","volume":"39","author":"Y Zhang","year":"2022","unstructured":"Zhang, Y., Han, S., Zhang, Z., et al.: CF-GAN: cross-domain feature fusion generative adversarial network for text-to-image synthesis. Visual Comput. 39(4), 1283\u20131293 (2022)","journal-title":"Visual Comput."},{"key":"3260_CR24","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1016\/j.neunet.2021.01.023","volume":"138","author":"D Peng","year":"2021","unstructured":"Peng, D., Yang, W., Liu, C., et al.: SAM-GAN: self-attention supporting multi-stage generative adversarial networks for text-to-image synthesis. Neural Netw.Netw. 138, 57\u201367 (2021)","journal-title":"Neural Netw.Netw."},{"key":"3260_CR25","unstructured":"Li, B., Qi, X., Lukasiewicz, T., et al.: Controllable text-to-image generation. arXiv, 2019 (2019-12-19)[2023-05-04]"},{"key":"3260_CR26","doi-asserted-by":"crossref","unstructured":"Schuster, M., Paliwal, K. K.: Bidirectional recurrent neural networks. IEEE Trans. Signal Process. 45(11), 2673\u20132681 (1997)","DOI":"10.1109\/78.650093"},{"key":"3260_CR27","unstructured":"Vaswani, A., et al.: Attention is all you need. Adv. Neural Inf. Process. Syst. 30 (2017)"},{"key":"3260_CR28","unstructured":"Vinker, Y., Pajouheshgar, E., Bo, J. Y., et al.: Clipasso: Semantically-aware object sketching. arXiv preprint arXiv:2202.05822"},{"key":"3260_CR29","unstructured":"Lin, T. Y., Maire, M., Belongie, S., et al.: Microsoft COCO. In: common objects in context, european conference on computer vision. [2023-03-20]"},{"key":"3260_CR30","unstructured":"Szegedy, C., Vanhoucke, V., Ioffe, S.: Rethinking the inception architecture for computer vision, In: Proceedings of the IEEE conference on computer vision and pattern recognition"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-024-03260-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-024-03260-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-024-03260-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,12]],"date-time":"2024-11-12T09:10:23Z","timestamp":1731402623000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-024-03260-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,2,9]]},"references-count":30,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2024,12]]}},"alternative-id":["3260"],"URL":"https:\/\/doi.org\/10.1007\/s00371-024-03260-2","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"type":"print","value":"0178-2789"},{"type":"electronic","value":"1432-2315"}],"subject":[],"published":{"date-parts":[[2024,2,9]]},"assertion":[{"value":"29 December 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 February 2024","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}},{"value":"All authors agreed to participate in this paper.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent to participate"}},{"value":"Not applicable.","order":5,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}}]}}