{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,19]],"date-time":"2025-12-19T14:46:41Z","timestamp":1766155601689,"version":"3.46.0"},"reference-count":84,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"4","license":[{"start":{"date-parts":[[2025,4,1]],"date-time":"2025-04-01T00:00:00Z","timestamp":1743465600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"name":"JSPS KAKENHI","award":["JP21H03456","JP23K11141"],"award-info":[{"award-number":["JP21H03456","JP23K11141"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Neural Netw. Learning Syst."],"published-print":{"date-parts":[[2025,4]]},"DOI":"10.1109\/tnnls.2024.3404496","type":"journal-article","created":{"date-parts":[[2024,7,3]],"date-time":"2024-07-03T13:34:10Z","timestamp":1720013650000},"page":"7529-7541","source":"Crossref","is-referenced-by-count":4,"title":["ConcVAE: Conceptual Representation Learning"],"prefix":"10.1109","volume":"36","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4474-3995","authenticated-orcid":false,"given":"Ren","family":"Togo","sequence":"first","affiliation":[{"name":"Faculty of Information Science and Technology, Hokkaido University, Sapporo, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9260-0828","authenticated-orcid":false,"given":"Nao","family":"Nakagawa","sequence":"additional","affiliation":[{"name":"Graduate School of Information Science and Technology, Hokkaido University, Sapporo, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5332-8112","authenticated-orcid":false,"given":"Takahiro","family":"Ogawa","sequence":"additional","affiliation":[{"name":"Faculty of Information Science and Technology, Hokkaido University, Sapporo, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1496-1761","authenticated-orcid":false,"given":"Miki","family":"Haseyama","sequence":"additional","affiliation":[{"name":"Faculty of Information Science and Technology, Hokkaido University, Sapporo, Japan"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2784440"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR48806.2021.9413032"},{"key":"ref3","first-page":"159","article-title":"Fixing a broken ELBO","volume-title":"Proc. Int. Conf. Mach. Learn. (ICML)","author":"Alemi"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.279"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/S0042-6989(97)00121-1"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.50"},{"key":"ref7","first-page":"15435","article-title":"Explicitly disentangling image content from translation and rotation with spatial-VAE","volume-title":"Proc. Neural Inf. Process. Syst. (NeurIPS)","author":"Bepler"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2015.2496947"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.29172\/7c2a6982-6d72-4cd8-bba6-2fccb06a7011"},{"key":"ref10","first-page":"1","article-title":"Understanding disentangling in \u03b2-VAE","volume-title":"Proc. Neural Inf. Process. Syst. (NIPS) Workshop","author":"Burgess"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2017.2690575"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3641289"},{"volume-title":"Anime-Face-Dataset","year":"2018","author":"Chao","key":"ref13"},{"key":"ref14","first-page":"2610","article-title":"Isolating sources of disentanglement in variational autoencoders","volume-title":"Proc. Neural Inf. Process. Syst. (NIPS)","author":"Chen"},{"key":"ref15","first-page":"2172","article-title":"InfoGAN: Interpretable representation learning by information maximizing generative adversarial nets","volume-title":"Proc. Adv. Neural Inf. Process. Syst. (NIPS)","author":"Chen"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/tnnls.2022.3190068"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/0165-1684(94)90029-9"},{"key":"ref18","first-page":"1436","article-title":"Flexibly fair representation learning by disentanglement","volume-title":"Proc. Int. Conf. Mach. Learn. (ICML)","author":"Creager"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00520"},{"key":"ref21","first-page":"1018","article-title":"Explicit disentanglement of appearance and perspective in generative models","volume-title":"Proc. Neural Inf. Process. Syst. (NeurIPS)","author":"Detlefsen"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00794"},{"key":"ref23","first-page":"1","article-title":"A framework for the quantitative evaluation of disentangled representations","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Eastwood"},{"key":"ref24","first-page":"1","article-title":"VSE++: Improving visual-semantic embeddings with hard negatives","volume-title":"Proc. Brit. Mach. Vis. Conf. (BMVC)","author":"Faghri"},{"issue":"1","key":"ref25","first-page":"70","article-title":"A free energy principle for the brain","volume":"100","author":"Friston","year":"2006","journal-title":"J. Physiol."},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00341"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.5555\/2969033.2969125"},{"key":"ref28","first-page":"2424","article-title":"Multi-object representation learning with iterative variational inference","volume-title":"Proc. Int. Conf. Mach. Learn. (ICML)","author":"Greff"},{"key":"ref29","first-page":"723","article-title":"A kernel two-sample test","volume":"13","author":"Gretton","year":"2012","journal-title":"J. Mach. Learn. Res."},{"key":"ref30","first-page":"2455","article-title":"Recurrent world models facilitate policy evolution","volume-title":"Proc. Neural Inf. Process. Syst. (NIPS)","author":"Ha"},{"issue":"1","key":"ref31","doi-asserted-by":"crossref","first-page":"335","DOI":"10.1016\/0167-2789(90)90087-6","article-title":"The symbol grounding problem","volume":"42","author":"Harnad","year":"1990","journal-title":"Physica D, Nonlinear Phenomena"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00385"},{"key":"ref34","first-page":"1","article-title":"\u03b2-VAE: Learning basic visual concepts with a constrained variational framework","volume-title":"Proc. Int. Conf. Learn. Represent. (ICLR)","author":"Higgins"},{"key":"ref35","first-page":"1480","article-title":"DARLA: Improving zero-shot transfer in reinforcement learning","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Higgins"},{"key":"ref36","doi-asserted-by":"crossref","first-page":"183","DOI":"10.1016\/j.neucom.2019.03.013","article-title":"Improving variational autoencoder with deep feature consistent and generative adversarial training","volume":"341","author":"Hou","year":"2019","journal-title":"Neurocomputing"},{"issue":"3","key":"ref37","doi-asserted-by":"crossref","first-page":"429","DOI":"10.1016\/S0893-6080(98)00140-3","article-title":"Nonlinear independent component analysis: Existence and uniqueness results","volume":"12","author":"Hyv\u00e4rinen","year":"1999","journal-title":"Neural Netw."},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00453"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00813"},{"key":"ref40","first-page":"1","article-title":"Now you see me (CME): Concept-based model extraction","volume-title":"Proc. ACM Int. Conf. Inf. Knowl. Manag. (CIKM) Workshop Adv. Interpretable Mach. Learn. Artif. Intell. (AIMLAI)","author":"Kazhdan"},{"key":"ref41","first-page":"2649","article-title":"Disentangling by factorising","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Kim"},{"key":"ref42","first-page":"1","article-title":"Adam: A method for stochastic optimization","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Kingma"},{"key":"ref43","first-page":"1","article-title":"Auto-encoding variational Bayes","volume-title":"Proc. Int. Conf. Learn. Represent. (ICLR)","author":"Kingma"},{"key":"ref44","first-page":"1","article-title":"Unifying visual-semantic embeddings with multimodal neural language models","volume-title":"Proc. Neural Inf. Process. Syst. (NIPS) Deep Learn. Represent. Learn. Workshop","author":"Kiros"},{"key":"ref45","first-page":"1","article-title":"Variational inference of disentangled latent concepts from unlabeled observations","volume-title":"Proc. Int. Conf. Learn. Represent. (ICLR)","author":"Kumar"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/5.726791"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2021.3135036"},{"key":"ref48","first-page":"1","article-title":"SPACE: Unsupervised object-oriented scene representation via spatial attention and decomposition","volume-title":"Proc. Int. Conf. Learn. Represent. (ICLR)","author":"Lin"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2022.3195533"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2022.3172903"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.425"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i09.7120"},{"key":"ref53","first-page":"4114","article-title":"Challenging common assumptions in the unsupervised learning of disentangled representations","volume-title":"Proc. Int. Conf. Mach. Learn. (ICML)","author":"Locatello"},{"key":"ref54","first-page":"14584","article-title":"On the fairness of disentangled representations","volume-title":"Proc. Neural Inf. Process. Syst. (NeurIPS)","author":"Locatello"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1111\/j.1756-8765.2010.01106.x"},{"key":"ref56","first-page":"4402","article-title":"Disentangling disentanglement in variational autoencoders","volume-title":"Proc. Int. Conf. Mach. Learn. (ICML)","author":"Mathieu"},{"key":"ref57","first-page":"1","article-title":"Gromov\u2013Wasserstein autoencoders","volume-title":"Proc. Int. Conf. Learn. Represent. (ICLR)","author":"Nakagawa"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP42928.2021.9506619"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/tnnls.2021.3105175"},{"key":"ref60","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"Proc. Int. Conf. Mach. Learn.","volume":"139","author":"Radford"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1146\/annurev-neuro-092920-120559"},{"key":"ref62","first-page":"9179","article-title":"Simple and effective VAE training with calibrated decoders","volume-title":"Proc. Int. Conf. Mach. Learn. (ICML)","author":"Rybkin"},{"volume-title":"Course in General Linguistics","year":"1966","author":"de Saussure","key":"ref63"},{"key":"ref64","article-title":"How to not measure disentanglement","author":"Sepliarskaia","year":"2019","journal-title":"arXiv:1910.05587"},{"key":"ref65","first-page":"1","article-title":"Very deep convolutional networks for large-scale image recognition","volume-title":"Proc. 3rd Intl. Conf. Learning Represent. (ICLR)","author":"Simonyan"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00362"},{"key":"ref67","first-page":"14222","article-title":"Are disentangled representations helpful for abstract visual reasoning?","volume-title":"Proc. Neural Inf. Process. Syst. (NeurIPS)","author":"van Steenkiste"},{"key":"ref68","first-page":"1","article-title":"Disentangling the independently controllable factors of variation by interacting with the world","volume-title":"Proc. Neural Inf. Process. Syst. (NIPS) Workshop","author":"Thomas"},{"key":"ref69","first-page":"368","article-title":"The information bottleneck method","volume-title":"Proc. Annu. Allerton Conf. Communnication, Control Comput.","author":"Tishby"},{"key":"ref70","first-page":"1","article-title":"Recent advances in autoencoder-based representation learning","volume-title":"Proc. Neural Inf. Process. Syst. (NIPS) Workshop Bayesian Deep Learn.","author":"Tschannen"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.306"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1016\/j.neuroimage.2017.06.042"},{"key":"ref74","volume":"4","author":"Wardhaugh","year":"2006","journal-title":"An Introduction to Sociolinguistics"},{"volume-title":"Knowing and Guessing: A Quantitative Study of Inference and Information","year":"1969","author":"Watanabe","key":"ref75"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1145\/3474085.3475681"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP42928.2021.9506169"},{"key":"ref78","first-page":"20554","article-title":"On completeness-aware concept-based explanations in deep neural networks","volume-title":"Proc. Neural Inf. Process. Syst. (NeurIPS)","author":"Yeh"},{"key":"ref79","first-page":"1","article-title":"QANet: Combining local convolution with global self-attention for reading comprehension","volume-title":"Proc. Int. Conf. Learn. Represent. (ICLR)","author":"Yu"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1109\/tnnls.2022.3218982"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33015885"},{"key":"ref82","first-page":"4091","article-title":"Learning hierarchical features from generative models","volume-title":"Proc. Int. Conf. Mach. Learn. (ICML)","author":"Zhao"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.235"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00580"}],"container-title":["IEEE Transactions on Neural Networks and Learning Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/5962385\/10949581\/10584324.pdf?arnumber=10584324","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,5]],"date-time":"2025-12-05T18:38:59Z","timestamp":1764959939000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10584324\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4]]},"references-count":84,"journal-issue":{"issue":"4"},"URL":"https:\/\/doi.org\/10.1109\/tnnls.2024.3404496","relation":{},"ISSN":["2162-237X","2162-2388"],"issn-type":[{"type":"print","value":"2162-237X"},{"type":"electronic","value":"2162-2388"}],"subject":[],"published":{"date-parts":[[2025,4]]}}}