{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,6]],"date-time":"2026-05-06T15:11:40Z","timestamp":1778080300518,"version":"3.51.4"},"publisher-location":"Cham","reference-count":51,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031434204","type":"print"},{"value":"9783031434211","type":"electronic"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-43421-1_35","type":"book-chapter","created":{"date-parts":[[2023,9,17]],"date-time":"2023-09-17T20:37:24Z","timestamp":1694983044000},"page":"593-609","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Learning Disentangled Discrete Representations"],"prefix":"10.1007","author":[{"given":"David","family":"Friede","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Christian","family":"Reimers","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Heiner","family":"Stuckenschmidt","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mathias","family":"Niepert","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,9,18]]},"reference":[{"key":"35_CR1","unstructured":"Adel, T., Ghahramani, Z., Weller, A.: Discovering interpretable representations for both deep generative and discriminative models. In: International Conference on Machine Learning, pp. 50\u201359. PMLR (2018)"},{"key":"35_CR2","doi-asserted-by":"crossref","unstructured":"Arcones, M.A., Gine, E.: On the bootstrap of $$U$$ and $$V$$ statistics. Annal. Statist. 20, 655\u2013674 (1992)","DOI":"10.1214\/aos\/1176348650"},{"issue":"8","key":"35_CR3","doi-asserted-by":"publisher","first-page":"1798","DOI":"10.1109\/TPAMI.2013.50","volume":"35","author":"Y Bengio","year":"2013","unstructured":"Bengio, Y., Courville, A., Vincent, P.: Representation learning: a review and new perspectives. IEEE Trans. Pattern Anal. Mach. Intell. 35(8), 1798\u20131828 (2013)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"35_CR4","unstructured":"Bengio, Y., L\u00e9onard, N., Courville, A.: Estimating or propagating gradients through stochastic neurons for conditional computation. arXiv:1308.3432 (2013)"},{"key":"35_CR5","unstructured":"Burgess, C.P., et al.: Understanding disentangling in $$\\beta $$-vae. arXiv:1804.03599 (2018)"},{"key":"35_CR6","unstructured":"Chen, R.T., Li, X., Grosse, R.B., Duvenaud, D.K.: Isolating sources of disentanglement in variational autoencoders. In: Advances in Neural Information Processing Systems, vol. 31, pp. 2615\u20132625 (2018)"},{"key":"35_CR7","unstructured":"Creager, E., et al.: Flexibly fair representation learning by disentanglement. In: International Conference on Machine Learning, pp. 1436\u20131445. PMLR (2019)"},{"key":"35_CR8","unstructured":"Dupont, E.: Learning disentangled joint continuous and discrete representations. In: Advances in Neural Information Processing Systems, vol. 31 (2018)"},{"key":"35_CR9","unstructured":"Eastwood, C., Williams, C.K.: A framework for the quantitative evaluation of disentangled representations. In: International Conference on Learning Representations (2018)"},{"key":"35_CR10","unstructured":"Friede, D., Niepert, M.: Efficient learning of discrete-continuous computation graphs. In: Advances in Neural Information Processing Systems, vol. 34, pp. 6720\u20136732 (2021)"},{"key":"35_CR11","unstructured":"Gondal, M.W., et al.: On the transfer of inductive bias from simulation to the real world: a new disentanglement dataset. In: Advances in Neural Information Processing Systems, vol. 32 (2019)"},{"key":"35_CR12","unstructured":"Grathwohl, W., Choi, D., Wu, Y., Roeder, G., Duvenaud, D.: Backpropagation through the void: optimizing control variates for black-box gradient estimation. In: International Conference on Learning Representations (2018)"},{"key":"35_CR13","unstructured":"Hafner, D., Lillicrap, T., Norouzi, M., Ba, J.: Mastering Atari with discrete world models. arXiv:2010.02193 (2020)"},{"key":"35_CR14","unstructured":"Hafner, D., Pasukonis, J., Ba, J., Lillicrap, T.: Mastering diverse domains through world models. arXiv:2301.04104 (2023)"},{"key":"35_CR15","unstructured":"Higgins, I., et al.: Towards a definition of disentangled representations. arXiv:1812.02230 (2018)"},{"key":"35_CR16","unstructured":"Higgins, I., et al.: $$\\beta $$-VAE: learning basic visual concepts with a constrained variational framework. In: International Conference on Learning Representations (2017)"},{"key":"35_CR17","unstructured":"Jang, E., Gu, S., Poole, B.: Categorical reparameterization with Gumbel-softmax. In: International Conference on Learning Representations (2017)"},{"key":"35_CR18","unstructured":"Jeong, Y., Song, H.O.: Learning discrete and continuous factors of data via alternating disentanglement. In: International Conference on Machine Learning, pp. 3091\u20133099. PMLR (2019)"},{"key":"35_CR19","unstructured":"Kim, H., Mnih, A.: Disentangling by factorising. In: International Conference on Machine Learning, pp. 2649\u20132658. PMLR (2018)"},{"key":"35_CR20","unstructured":"Kingma, D.P., Welling, M.: Auto-encoding variational Bayes. In: International Conference on Learning Representations (2013)"},{"key":"35_CR21","unstructured":"Klindt, D.A., et al.: Towards nonlinear disentanglement in natural data with temporal sparse coding. In: International Conference on Learning Representations (2021)"},{"key":"35_CR22","unstructured":"Kumar, A., Sattigeri, P., Balakrishnan, A.: Variational inference of disentangled latent concepts from unlabeled observations. In: International Conference on Learning Representations (2017)"},{"key":"35_CR23","unstructured":"LeCun, Y., Huang, F.J., Bottou, L.: Learning methods for generic object recognition with invariance to pose and lighting. In: Proceedings of the 2004 IEEE Computer Society Conference on Computer Vision and Pattern Recognition, 2004. CVPR 2004. vol. 2, pp. II-104. IEEE (2004)"},{"key":"35_CR24","unstructured":"Locatello, F., Abbati, G., Rainforth, T., Bauer, S., Sch\u00f6lkopf, B., Bachem, O.: On the fairness of disentangled representations. In: Advances in Neural Information Processing Systems, vol. 32 (2019)"},{"key":"35_CR25","unstructured":"Locatello, F., et al.: Challenging common assumptions in the unsupervised learning of disentangled representations. In: International Conference on Machine Learning, pp. 4114\u20134124. PMLR (2019)"},{"key":"35_CR26","unstructured":"Locatello, F., Poole, B., R\u00e4tsch, G., Sch\u00f6lkopf, B., Bachem, O., Tschannen, M.: Weakly-supervised disentanglement without compromises. In: International Conference on Machine Learning, pp. 6348\u20136359. PMLR (2020)"},{"key":"35_CR27","unstructured":"Locatello, F., Tschannen, M., Bauer, S., R\u00e4tsch, G., Sch\u00f6lkopf, B., Bachem, O.: Disentangling factors of variations using few labels. In: International Conference on Learning Representations (2020)"},{"key":"35_CR28","unstructured":"Maddison, C.J., Mnih, A., Teh, Y.W.: The concrete distribution: a continuous relaxation of discrete random variables. In: International Conference on Learning Representations (2017)"},{"key":"35_CR29","unstructured":"Makhzani, A., Shlens, J., Jaitly, N., Goodfellow, I., Frey, B.: Adversarial autoencoders. arXiv:1511.05644 (2015)"},{"issue":"11","key":"35_CR30","doi-asserted-by":"publisher","first-page":"5847","DOI":"10.1109\/TIT.2010.2068870","volume":"56","author":"X Nguyen","year":"2010","unstructured":"Nguyen, X., Wainwright, M.J., Jordan, M.I.: Estimating divergence functionals and the likelihood ratio by convex risk minimization. IEEE Trans. Inf. Theory 56(11), 5847\u20135861 (2010)","journal-title":"IEEE Trans. Inf. Theory"},{"key":"35_CR31","unstructured":"Ozair, S., Li, Y., Razavi, A., Antonoglou, I., Van Den Oord, A., Vinyals, O.: Vector quantized models for planning. In: International Conference on Machine Learning, pp. 8302\u20138313. PMLR (2021)"},{"key":"35_CR32","unstructured":"Peters, J., Janzing, D., Sch\u00f6lkopf, B.: Elements of causal inference: foundations and learning algorithms. The MIT Press (2017)"},{"key":"35_CR33","unstructured":"Ramesh, A., et al.: Zero-shot text-to-image generation. In: International Conference on Machine Learning, pp. 8821\u20138831. PMLR (2021)"},{"key":"35_CR34","unstructured":"Razavi, A., Van den Oord, A., Vinyals, O.: Generating diverse high-fidelity images with VQ-VAE-2. In: Advances in Neural Information Processing Systems, vol. 32 (2019)"},{"key":"35_CR35","unstructured":"Reed, S.E., Zhang, Y., Zhang, Y., Lee, H.: Deep visual analogy-making. In: Advances in Neural Information Processing Systems, vol. 28 (2015)"},{"key":"35_CR36","unstructured":"Ridgeway, K., Mozer, M.C.: Learning deep disentangled embeddings with the F-statistic loss. In: Advances in Neural Information Processing Systems, vol. 31 (2018)"},{"key":"35_CR37","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., Ommer, B.: High-resolution image synthesis with latent diffusion models. IEEE 2022. In: CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 10674\u201310685 (2022)","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"35_CR38","unstructured":"Sch\u00f6lkopf, B., Janzing, D., Peters, J., Sgouritsa, E., Zhang, K., Mooij, J.M.: On causal and anticausal learning. In: International Conference on Machine Learning (2012)"},{"key":"35_CR39","unstructured":"Shayer, O., Levi, D., Fetaya, E.: Learning discrete weights using the local reparameterization trick. In: International Conference on Learning Representations (2018)"},{"key":"35_CR40","unstructured":"Shu, R., Chen, Y., Kumar, A., Ermon, S., Poole, B.: Weakly supervised disentanglement with guarantees. In: International Conference on Learning Representations (2020)"},{"issue":"5","key":"35_CR41","doi-asserted-by":"publisher","first-page":"1009","DOI":"10.1007\/s10463-011-0343-8","volume":"64","author":"M Sugiyama","year":"2012","unstructured":"Sugiyama, M., Suzuki, T., Kanamori, T.: Density-ratio matching under the Bregman divergence: a unified framework of density-ratio estimation. Ann. Inst. Stat. Math. 64(5), 1009\u20131044 (2012)","journal-title":"Ann. Inst. Stat. Math."},{"key":"35_CR42","unstructured":"Tr\u00e4uble, F., et al.: On disentangled representations learned from correlated data. In: International Conference on Machine Learning, pp. 10401\u201310412. PMLR (2021)"},{"key":"35_CR43","unstructured":"Tschannen, M., Bachem, O., Lucic, M.: Recent advances in autoencoder-based representation learning. arXiv:1812.05069 (2018)"},{"key":"35_CR44","unstructured":"Tucker, G., Mnih, A., Maddison, C.J., Lawson, J., Sohl-Dickstein, J.: REBAR: low-variance, unbiased gradient estimates for discrete latent variable models. In: Advances in Neural Information Processing Systems, vol. 30 (2017)"},{"key":"35_CR45","unstructured":"Van Den Oord, A., Vinyals, O., et al.: Neural discrete representation learning. In: Advances in Neural Information Processing Systems, vol. 30 (2017)"},{"key":"35_CR46","unstructured":"Van Steenkiste, S., Locatello, F., Schmidhuber, J., Bachem, O.: Are disentangled representations helpful for abstract visual reasoning? In: Advances in Neural Information Processing Systems, vol. 32 (2019)"},{"key":"35_CR47","unstructured":"Vaswani, A., et al.: Attention is all you need. In: Advances in Neural Information Processing Systems, vol. 30 (2017)"},{"issue":"1","key":"35_CR48","doi-asserted-by":"publisher","first-page":"66","DOI":"10.1147\/rd.41.0066","volume":"4","author":"S Watanabe","year":"1960","unstructured":"Watanabe, S.: Information theoretical analysis of multivariate correlation. IBM J. Res. Dev. 4(1), 66\u201382 (1960)","journal-title":"IBM J. Res. Dev."},{"key":"35_CR49","unstructured":"Watters, N., Matthey, L., Borgeaud, S., Kabra, R., Lerchner, A.: Spriteworld: a flexible, configurable reinforcement learning environment (2019)"},{"key":"35_CR50","unstructured":"Watters, N., Matthey, L., Burgess, C.P., Lerchner, A.: Spatial broadcast decoder: a simple architecture for learning disentangled representations in VAEs. arXiv:1901.07017 (2019)"},{"key":"35_CR51","doi-asserted-by":"crossref","unstructured":"Williams, R.J.: Simple statistical gradient-following algorithms for connectionist reinforcement learning. Reinforcement Learning, pp. 5\u201332 (1992)","DOI":"10.1007\/978-1-4615-3618-5_2"}],"container-title":["Lecture Notes in Computer Science","Machine Learning and Knowledge Discovery in Databases: Research Track"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-43421-1_35","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,9,17]],"date-time":"2023-09-17T20:47:26Z","timestamp":1694983646000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-43421-1_35"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031434204","9783031434211"],"references-count":51,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-43421-1_35","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"18 September 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECML PKDD","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Joint European Conference on Machine Learning and Knowledge Discovery in Databases","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Turin","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18 September 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22 September 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ecml2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/2023.ecmlpkdd.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"CMT","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"829","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"196","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"24% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.63","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"4.5","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Applied Data Science Track: 239 submissions, 58 accepted papers; Demo Track: 31 submissions, 16 accepted papers.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}