{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T09:09:05Z","timestamp":1743066545149,"version":"3.40.3"},"publisher-location":"Singapore","reference-count":36,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819786916"},{"type":"electronic","value":"9789819786923"}],"license":[{"start":{"date-parts":[[2024,11,1]],"date-time":"2024-11-01T00:00:00Z","timestamp":1730419200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,1]],"date-time":"2024-11-01T00:00:00Z","timestamp":1730419200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-97-8692-3_15","type":"book-chapter","created":{"date-parts":[[2024,10,31]],"date-time":"2024-10-31T14:03:04Z","timestamp":1730383384000},"page":"206-219","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Variational Capsules for Image Analysis and Synthesis"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-4812-7625","authenticated-orcid":false,"given":"Yuguang","family":"Zhang","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5866-2283","authenticated-orcid":false,"given":"Huaibo","family":"Huang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,1]]},"reference":[{"key":"15_CR1","doi-asserted-by":"crossref","unstructured":"Bao, J., Chen, D., Wen, F., Li, H., Hua, G.: CVAE-GAN: fine-grained image generation through asymmetric training. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.299"},{"key":"15_CR2","doi-asserted-by":"crossref","unstructured":"Bao, J., Chen, D., Wen, F., Li, H., Hua, G.: Towards open-set identity preserving face synthesis. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00702"},{"key":"15_CR3","unstructured":"Bruna, J., Sprechmann, P., LeCun, Y.: Super-resolution with deep convolutional sufficient statistics. In: ICLR (2016)"},{"key":"15_CR4","doi-asserted-by":"crossref","unstructured":"Ding, H., Zhou, H., Zhou, S.K., Chellappa, R.: A deep cascade network for unaligned face attribute classification. In: AAAI (2018)","DOI":"10.1609\/aaai.v32i1.12303"},{"key":"15_CR5","doi-asserted-by":"crossref","unstructured":"Esser, P., Rombach, R., Ommer, B.: Taming transformers for high-resolution image synthesis. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.01268"},{"key":"15_CR6","unstructured":"Fu, C., Wu, X., Hu, Y., Huang, H., He, R.: Dual variational generation for low-shot heterogeneous face recognition. In: NeurIPS (2019)"},{"key":"15_CR7","unstructured":"Fu, C., Wu, X., Hu, Y., Huang, H., He, R.: Dvg-face: dual variational generation for heterogeneous face recognition. IEEE TPAMI PP(99), 1\u20131 (2021)"},{"key":"15_CR8","unstructured":"Goodfellow, I., Pouget-Abadie, J., Mirza, M., Xu, B., Warde-Farley, D., Ozair, S., Courville, A., Bengio, Y.: Generative adversarial nets. In: NIPS (2014)"},{"key":"15_CR9","doi-asserted-by":"crossref","unstructured":"Hand, E.M., Chellappa, R.: Attributes for improved attributes: a multi-task network utilizing implicit and explicit relationships for facial attribute classification. In: AAAI (2017)","DOI":"10.1609\/aaai.v31i1.11229"},{"key":"15_CR10","doi-asserted-by":"crossref","unstructured":"Hinton, G.E., Krizhevsky, A., Wang, S.D.: Transforming auto-encoders. In: ICANN (2011)","DOI":"10.1007\/978-3-642-21735-7_6"},{"key":"15_CR11","unstructured":"Hinton, G.E., Sabour, S., Frosst, N.: Matrix capsules with EM routing. In: ICLR (2018)"},{"key":"15_CR12","unstructured":"Ho, J., Jain, A., Abbeel, P.: Denoising diffusion probabilistic models. In: NIPS (2020)"},{"key":"15_CR13","unstructured":"Huang, H., Li, Z., He, R., Sun, Z., Tan, T.: Introvae: introspective variational autoencoders for photographic image synthesis. In: NIPS (2018)"},{"key":"15_CR14","doi-asserted-by":"crossref","unstructured":"Johnson, J., Alahi, A., Fei-Fei, L.: Perceptual losses for real-time style transfer and super-resolution. In: ECCV (2016)","DOI":"10.1007\/978-3-319-46475-6_43"},{"key":"15_CR15","doi-asserted-by":"crossref","unstructured":"Kim, G., Kwon, T., Ye, J.C.: Diffusionclip: Text-guided diffusion models for robust image manipulation. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.00246"},{"key":"15_CR16","unstructured":"Kingma, D.P., Welling, M.: Auto-encoding variational Bayes. In: ICLR (2014)"},{"key":"15_CR17","unstructured":"Lample, G., Zeghidour, N., Usunier, N., Bordes, A., Denoyer, L., et\u00a0al.: Fader networks: manipulating images by sliding attributes. In: NIPS (2017)"},{"issue":"11","key":"15_CR18","doi-asserted-by":"publisher","first-page":"2278","DOI":"10.1109\/5.726791","volume":"86","author":"Y LeCun","year":"1998","unstructured":"LeCun, Y., Bottou, L., Bengio, Y., Haffner, P.: Gradient-based learning applied to document recognition. Proc. IEEE 86(11), 2278\u20132324 (1998)","journal-title":"Proc. IEEE"},{"key":"15_CR19","doi-asserted-by":"crossref","unstructured":"Ledig, C., Theis, L., Huszar, F., Caballero, J., Cunningham, A., Acosta, A., Aitken, A., Tejani, A., Totz, J., Wang, Z., Shi, W.: Photo-realistic single image super-resolution using a generative adversarial network. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.19"},{"key":"15_CR20","doi-asserted-by":"crossref","unstructured":"Liu, Z., Luo, P., Wang, X., Tang, X.: Deep learning face attributes in the wild. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.425"},{"key":"15_CR21","doi-asserted-by":"crossref","unstructured":"Mao, X., Li, Q., Xie, H., Lau, R.Y., Wang, Z., Smolley, S.P.: Least squares generative adversarial networks. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.304"},{"key":"15_CR22","unstructured":"Mirza, M., Osindero, S.: Conditional generative adversarial nets. In: NIPSW (2014)"},{"key":"15_CR23","unstructured":"van\u00a0den Oord, A., Kalchbrenner, N., Espeholt, L., Vinyals, O., Graves, A., et\u00a0al.: Conditional image generation with pixelcnn decoders. In: NIPS (2016)"},{"key":"15_CR24","unstructured":"Perarnau, G., van\u00a0de Weijer, J., Raducanu, B., \u00c1lvarez, J.M.: Invertible conditional gans for image editing. In: NIPSW (2016)"},{"key":"15_CR25","doi-asserted-by":"crossref","unstructured":"Preechakul, K., Chatthee, N., Wizadwongsa, S., Suwajanakorn, S.: Diffusion autoencoders: toward a meaningful and decodable representation. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.01036"},{"key":"15_CR26","unstructured":"Rezende, D.J., Mohamed, S., Wierstra, D.: Stochastic backpropagation and approximate inference in deep generative models. In: ICML (2014)"},{"key":"15_CR27","doi-asserted-by":"crossref","unstructured":"Rudd, E.M., G\u00fcnther, M., Boult, T.E.: Moon: a mixed objective optimization network for the recognition of facial attributes. In: ECCV (2016)","DOI":"10.1007\/978-3-319-46454-1_2"},{"key":"15_CR28","unstructured":"Sabour, S., Frosst, N., Hinton, G.E.: Dynamic routing between capsules. In: NIPS (2017)"},{"key":"15_CR29","doi-asserted-by":"crossref","unstructured":"Shu, Z., Yumer, E., Hadap, S., Sunkavalli, K., Shechtman, E., Samaras, D.: Neural face editing with intrinsic image disentangling. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.578"},{"key":"15_CR30","unstructured":"Van Den\u00a0Oord, A., Vinyals, O., et\u00a0al.: Neural discrete representation learning. In: NIPS (2017)"},{"key":"15_CR31","unstructured":"Van\u00a0Oord, A., Kalchbrenner, N., Kavukcuoglu, K.: Pixel recurrent neural networks. In: ICML (2016)"},{"key":"15_CR32","doi-asserted-by":"crossref","unstructured":"Wang, L., Yang, S., Liu, S., Chen, Y.c.: Not all steps are created equal: selective diffusion distillation for image manipulation. In: ICCV (2023)","DOI":"10.1109\/ICCV51070.2023.00687"},{"key":"15_CR33","doi-asserted-by":"crossref","unstructured":"Wang, T.C., Liu, M.Y., Zhu, J.Y., Tao, A., Kautz, J., Catanzaro, B.: High-resolution image synthesis and semantic manipulation with conditional GANs. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00917"},{"key":"15_CR34","doi-asserted-by":"crossref","unstructured":"Yan, X., Yang, J., Sohn, K., Lee, H.: Attribute2image: Conditional image generation from visual attributes. In: ECCV (2016)","DOI":"10.1007\/978-3-319-46493-0_47"},{"key":"15_CR35","doi-asserted-by":"crossref","unstructured":"Zhan, F., Yu, Y., Wu, R., Zhang, J., Cui, K., Zhang, C., Lu, S.: Auto-regressive image synthesis with integrated quantization. In: ECCV (2022)","DOI":"10.1007\/978-3-031-19787-1_7"},{"key":"15_CR36","unstructured":"Zhang, Y., et\u00a0al.: Image Analysis. Walter de Gruyter GmbH & Co KG (2017)"}],"container-title":["Lecture Notes in Computer Science","Pattern Recognition and Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-97-8692-3_15","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,31]],"date-time":"2024-10-31T14:24:51Z","timestamp":1730384691000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-97-8692-3_15"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,1]]},"ISBN":["9789819786916","9789819786923"],"references-count":36,"URL":"https:\/\/doi.org\/10.1007\/978-981-97-8692-3_15","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024,11,1]]},"assertion":[{"value":"1 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"PRCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Chinese Conference on Pattern Recognition and Computer Vision  (PRCV)","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Urumqi","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18 October 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"7","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ccprcv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/2024.prcv.cn\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}