{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T19:16:57Z","timestamp":1757618217877,"version":"3.44.0"},"reference-count":89,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2025,6,6]],"date-time":"2025-06-06T00:00:00Z","timestamp":1749168000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,6,6]],"date-time":"2025-06-06T00:00:00Z","timestamp":1749168000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Stat Comput"],"published-print":{"date-parts":[[2025,10]]},"DOI":"10.1007\/s11222-025-10657-z","type":"journal-article","created":{"date-parts":[[2025,6,6]],"date-time":"2025-06-06T03:11:09Z","timestamp":1749179469000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Information preservation with wasserstein autoencoders: generation consistency and adversarial robustness"],"prefix":"10.1007","volume":"35","author":[{"given":"Anish","family":"Chakrabarty","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Arkaprabha","family":"Basu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Swagatam","family":"Das","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,6,6]]},"reference":[{"key":"10657_CR1","doi-asserted-by":"crossref","unstructured":"Ashtiani, H., Ben-David, S., Mehrabian, A.: Sample-efficient learning of mixtures. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 32 (2018)","DOI":"10.1609\/aaai.v32i1.11627"},{"issue":"1","key":"10657_CR2","doi-asserted-by":"publisher","first-page":"391","DOI":"10.1214\/23-EJS2104","volume":"17","author":"H Asatryan","year":"2023","unstructured":"Asatryan, H., Gottschalk, H., Lippert, M., Rottmann, M.: A convenient infinite dimensional framework for generative adversarial learning. Electron. J. Stat 17(1), 391\u2013428 (2023)","journal-title":"Electron. J. Stat"},{"key":"10657_CR3","doi-asserted-by":"crossref","unstructured":"Acharya, J., Jafarpour, A., Orlitsky, A., Suresh, A.T.: Sorting with adversarial comparators and application to density estimation. In: 2014 IEEE International Symposium on Information Theory, pp. 1682\u20131686 (2014). IEEE","DOI":"10.1109\/ISIT.2014.6875120"},{"key":"10657_CR4","unstructured":"Anil, C., Lucas, J., Grosse, R.: Sorting out lipschitz function approximation. In: International Conference on Machine Learning, pp. 291\u2013301 (2019). PMLR"},{"issue":"3","key":"10657_CR5","doi-asserted-by":"publisher","first-page":"930","DOI":"10.1109\/18.256500","volume":"39","author":"AR Barron","year":"1993","unstructured":"Barron, A.R.: Universal approximation bounds for superpositions of a sigmoidal function. IEEE Trans. Inf. Theory 39(3), 930\u2013945 (1993)","journal-title":"IEEE Trans. Inf. Theory"},{"issue":"8","key":"10657_CR6","doi-asserted-by":"publisher","first-page":"1798","DOI":"10.1109\/TPAMI.2013.50","volume":"35","author":"Y Bengio","year":"2013","unstructured":"Bengio, Y., Courville, A., Vincent, P.: Representation learning: A review and new perspectives. IEEE Trans. Pattern Anal. Mach. Intell. 35(8), 1798\u20131828 (2013)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"1","key":"10657_CR7","doi-asserted-by":"publisher","first-page":"190","DOI":"10.1016\/S0047-259X(03)00079-4","volume":"88","author":"L Baringhaus","year":"2004","unstructured":"Baringhaus, L., Franz, C.: On a new multivariate two-sample test. J. Multivar. Anal. 88(1), 190\u2013206 (2004)","journal-title":"J. Multivar. Anal."},{"issue":"1","key":"10657_CR8","doi-asserted-by":"publisher","first-page":"300","DOI":"10.1137\/S0895479895296896","volume":"21","author":"A Ben-Israel","year":"1999","unstructured":"Ben-Israel, A.: The change-of-variables formula using matrix volume. SIAM J. Matrix Anal. Appl. 21(1), 300\u2013312 (1999)","journal-title":"SIAM J. Matrix Anal. Appl."},{"key":"10657_CR9","unstructured":"Birrell, J., Katsoulakis, M.A., Rey-Bellet, L., Zhu, W.: Structure-preserving gans. In: International Conference on Machine Learning (2022)"},{"key":"10657_CR10","doi-asserted-by":"publisher","first-page":"46","DOI":"10.1007\/BF02776078","volume":"52","author":"J Bourgain","year":"1985","unstructured":"Bourgain, J.: On lipschitz embedding of finite metric spaces in hilbert space. Israel J. Math. 52, 46\u201352 (1985)","journal-title":"Israel J. Math."},{"issue":"4","key":"10657_CR11","doi-asserted-by":"publisher","first-page":"375","DOI":"10.1002\/cpa.3160440402","volume":"44","author":"Y Brenier","year":"1991","unstructured":"Brenier, Y.: Polar factorization and monotone rearrangement of vector-valued functions. Commun. Pure Appl. Math. 44(4), 375\u2013417 (1991)","journal-title":"Commun. Pure Appl. Math."},{"key":"10657_CR12","doi-asserted-by":"crossref","unstructured":"Bartal, Y., Recht, B., Schulman, L.J.: Dimensionality reduction: beyond the johnson-lindenstrauss bound. In: Proceedings of the Twenty-second Annual ACM-SIAM Symposium on Discrete Algorithms, pp. 868\u2013887 (2011). SIAM","DOI":"10.1137\/1.9781611973082.68"},{"key":"10657_CR13","doi-asserted-by":"publisher","first-page":"547","DOI":"10.1007\/s002200000257","volume":"214","author":"LA Caffarelli","year":"2000","unstructured":"Caffarelli, L.A.: Monotonicity properties of optimal transportation and the fkg and related inequalities. Commun. Math. Phys. 214, 547\u2013563 (2000)","journal-title":"Commun. Math. Phys."},{"key":"10657_CR14","unstructured":"Chakraborty, S., Bartlett, P.: A statistical analysis of wasserstein autoencoders for intrinsically low-dimensional data. In: The 12th International Conference on Learning Representations (2024)"},{"key":"10657_CR15","first-page":"17098","volume":"34","author":"A Chakrabarty","year":"2021","unstructured":"Chakrabarty, A., Das, S.: Statistical regeneration guarantees of the wasserstein autoencoder with latent space consistency. Advances in Neural Information Processing Systems (NeurIPS) 34, 17098\u201317110 (2021)","journal-title":"Advances in Neural Information Processing Systems (NeurIPS)"},{"key":"10657_CR16","doi-asserted-by":"publisher","first-page":"1007","DOI":"10.1016\/j.jde.2020.09.032","volume":"271","author":"M Colombo","year":"2021","unstructured":"Colombo, M., Fathi, M.: Bounds on optimal transport maps onto log-concave measures. J. Differ. Equ 271, 1007\u20131022 (2021)","journal-title":"J. Differ. Equ"},{"key":"10657_CR17","unstructured":"Courty, N., Flamary, R., Ducoffe, M.: Learning wasserstein embeddings. In: International Conference on Learning Representations (2018)"},{"key":"10657_CR18","doi-asserted-by":"publisher","first-page":"3752","DOI":"10.1214\/16-EJS1216","volume":"10","author":"M Chen","year":"2016","unstructured":"Chen, M., Gao, C., Ren, Z.: A general decision theory for Huber\u2019s $$\\epsilon $$-contamination model. Electron. J. Stat. 10, 3752\u20133774 (2016)","journal-title":"Electron. J. Stat."},{"key":"10657_CR19","unstructured":"Chen, M., Jiang, H., Liao, W., Zhao, T.: Efficient approximation of deep relu networks for functions on low dimensional manifolds. Advances in neural information processing systems 32 (2019)"},{"key":"10657_CR20","unstructured":"Chen, Z., Katsoulakis, M., Rey-Bellet, L., Zhu, W.: Sample complexity of probability divergences under group symmetry. In: International Conference on Machine Learning, pp. 4713\u20134734 (2023). PMLR"},{"issue":"3","key":"10657_CR21","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/1970392.1970395","volume":"58","author":"EJ Cand\u00e8s","year":"2011","unstructured":"Cand\u00e8s, E.J., Li, X., Ma, Y., Wright, J.: Robust principal component analysis? Journal of the ACM (JACM) 58(3), 1\u201337 (2011)","journal-title":"Journal of the ACM (JACM)"},{"issue":"12","key":"10657_CR22","doi-asserted-by":"publisher","first-page":"2405","DOI":"10.1002\/cpa.21707","volume":"70","author":"P-A Chiappori","year":"2017","unstructured":"Chiappori, P.-A., McCann, R.J., Pass, B.: Multi-to one-dimensional optimal transport. Commun. Pure Appl. Math. 70(12), 2405\u20132444 (2017)","journal-title":"Commun. Pure Appl. Math."},{"key":"10657_CR23","unstructured":"Chernodub, A., Nowicki, D.: Norm-preserving orthogonal permutation linear unit activation functions (oplu). arXiv preprint arXiv:1604.02313 (2016)"},{"key":"10657_CR24","unstructured":"Caragea, A., Petersen, P., Voigtlaender, F.: Neural network approximation and estimation of classifiers with classification boundary in a barron class. arXiv preprint arXiv:2011.09363 (2020)"},{"issue":"1","key":"10657_CR25","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1007\/s00365-021-09548-z","volume":"55","author":"I Daubechies","year":"2022","unstructured":"Daubechies, I., DeVore, R., Foucart, S., Hanin, B., Petrova, G.: Nonlinear approximation and (deep) relu networks. Constr. Approx. 55(1), 127\u2013172 (2022)","journal-title":"Constr. Approx."},{"key":"10657_CR26","doi-asserted-by":"crossref","unstructured":"Devroye, L., Gyorfi, L.: No empirical probability measure can converge in the total variation sense for all distributions. The Annals of Statistics, 1496\u20131499 (1990)","DOI":"10.1214\/aos\/1176347765"},{"key":"10657_CR27","unstructured":"Dvurechensky, P., Gasnikov, A., Kroshnin, A.: Computational optimal transport: Complexity by accelerated gradient descent is better than by sinkhorn\u2019s algorithm. In: Proceedings of the 35th International Conference on Machine Learning. Proceedings of Machine Learning Research, vol. 80 (2018)"},{"key":"10657_CR28","doi-asserted-by":"crossref","unstructured":"Devroye, L., Lugosi, G.: Combinatorial Methods in Density Estimation. Springer (2001)","DOI":"10.1007\/978-1-4613-0125-7"},{"key":"10657_CR29","doi-asserted-by":"crossref","unstructured":"David, G., Semmes, S.: Regular mappings between dimensions. Publicacions Matematiques, 369\u2013417 (2000)","DOI":"10.5565\/PUBLMAT_44200_02"},{"key":"10657_CR30","unstructured":"Dai, B., Wipf, D.: Diagnosing and enhancing VAE models. In: International Conference on Learning Representations (2019)"},{"issue":"1","key":"10657_CR31","first-page":"1573","volume":"19","author":"B Dai","year":"2018","unstructured":"Dai, B., Wang, Y., Aston, J., Hua, G., Wipf, D.: Connections with robust pca and the role of emergent sparsity in variational autoencoder models. J. Mach. Learn. Res. 19(1), 1573\u20131614 (2018)","journal-title":"J. Mach. Learn. Res."},{"issue":"7","key":"10657_CR32","doi-asserted-by":"publisher","first-page":"1858","DOI":"10.1109\/TIT.2003.813506","volume":"49","author":"DM Endres","year":"2003","unstructured":"Endres, D.M., Schindelin, J.E.: A new metric for probability distributions. IEEE Trans. Inf. Theory 49(7), 1858\u20131860 (2003)","journal-title":"IEEE Trans. Inf. Theory"},{"issue":"1","key":"10657_CR33","doi-asserted-by":"publisher","first-page":"155","DOI":"10.1093\/mnras\/225.1.155","volume":"225","author":"G Fasano","year":"1987","unstructured":"Fasano, G., Franceschini, A.: A multidimensional version of the kolmogorov-smirnov test. Mon. Not. R. Astron. Soc. 225(1), 155\u2013170 (1987)","journal-title":"Mon. Not. R. Astron. Soc."},{"key":"10657_CR34","unstructured":"Franz, C.: cramer: multivariate nonparametric cramer-test for the two-sample-problem. R package version 0.8-1 (2006)"},{"issue":"1","key":"10657_CR35","first-page":"723","volume":"13","author":"A Gretton","year":"2012","unstructured":"Gretton, A., Borgwardt, K.M., Rasch, M.J., Sch\u00f6lkopf, B., Smola, A.: A kernel two-sample test. J. Mach. Learn. Res 13(1), 723\u2013773 (2012)","journal-title":"J. Mach. Learn. Res"},{"key":"10657_CR36","doi-asserted-by":"crossref","unstructured":"Gin\u00e9, E., Guillou, A.: Rates of strong uniform consistency for multivariate kernel density estimators. In: Annales de l\u2019Institut Henri Poincare (B) Probability and Statistics, vol. 38, pp. 907\u2013921 (2002). Elsevier","DOI":"10.1016\/S0246-0203(02)01128-7"},{"issue":"8","key":"10657_CR37","doi-asserted-by":"publisher","first-page":"4838","DOI":"10.1109\/TIT.2017.2713820","volume":"63","author":"L-A Gottlieb","year":"2017","unstructured":"Gottlieb, L.-A., Kontorovich, A., Krauthgamer, R.: Efficient regression in metric spaces via approximate lipschitz extension. IEEE Trans. Inf. Theory 63(8), 4838\u20134849 (2017)","journal-title":"IEEE Trans. Inf. Theory"},{"issue":"1","key":"10657_CR38","doi-asserted-by":"publisher","first-page":"259","DOI":"10.1007\/s00365-021-09543-4","volume":"55","author":"R Gribonval","year":"2022","unstructured":"Gribonval, R., Kutyniok, G., Nielsen, M., Voigtlaender, F.: Approximation spaces of deep neural networks. Constr. Approx. 55(1), 259\u2013367 (2022)","journal-title":"Constr. Approx."},{"key":"10657_CR39","doi-asserted-by":"crossref","unstructured":"Gin\u00e9, E., Nickl, R.: Mathematical Foundations of Infinite-dimensional Statistical Models. Cambridge university press (2021)","DOI":"10.1017\/9781009022811"},{"key":"10657_CR40","unstructured":"Goodfellow, I., Pouget-Abadie, J., Mirza, M., Xu, B., Warde-Farley, D., Ozair, S., Courville, A., Bengio, Y.: Generative adversarial nets. In: Advances in Neural Information Processing Systems, vol. 27 (2014)"},{"key":"10657_CR41","doi-asserted-by":"crossref","unstructured":"Huster, T., Chiang, C.-Y.J., Chadha, R.: Limitations of the lipschitz constant as a defense against adversarial examples. In: ECML PKDD 2018 Workshops. Springer (2019)","DOI":"10.1007\/978-3-030-13453-2_2"},{"key":"10657_CR42","unstructured":"Husain, H., Nock, R., Williamson, R.C.: A primal-dual link between gans and autoencoders. Advances in Neural Information Processing Systems 32 (2019)"},{"issue":"3","key":"10657_CR43","doi-asserted-by":"publisher","first-page":"429","DOI":"10.1016\/S0893-6080(98)00140-3","volume":"12","author":"A Hyv\u00e4rinen","year":"1999","unstructured":"Hyv\u00e4rinen, A., Pajunen, P.: Nonlinear independent component analysis: Existence and uniqueness results. Neural Netw. 12(3), 429\u2013439 (1999)","journal-title":"Neural Netw."},{"key":"10657_CR44","doi-asserted-by":"publisher","first-page":"189","DOI":"10.1090\/conm\/026\/737400","volume":"26","author":"WB Johnson","year":"1984","unstructured":"Johnson, W.B., Lindenstrauss, J.: Extensions of Lipschitz mappings into a Hilbert space. Conference in modern analysis and probability 26, 189\u2013206 (1984)","journal-title":"Conference in modern analysis and probability"},{"key":"10657_CR45","first-page":"21775","volume":"33","author":"A Jain","year":"2020","unstructured":"Jain, A., Orlitsky, A.: A general method for robust learning from batches. Adv. Neural. Inf. Process. Syst. 33, 21775\u201321785 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"10657_CR46","doi-asserted-by":"crossref","unstructured":"Jiang, Z., Zheng, Y., Tan, H., Tang, B., Zhou, H.: Variational deep embedding: An unsupervised and generative approach to clustering. In: Proceedings of the Twenty-Sixth International Joint Conference on Artificial Intelligence, IJCAI-17, pp. 1965\u20131972 (2017)","DOI":"10.24963\/ijcai.2017\/273"},{"issue":"12","key":"10657_CR47","doi-asserted-by":"publisher","first-page":"7649","DOI":"10.1109\/TIT.2018.2874447","volume":"64","author":"JM Klusowski","year":"2018","unstructured":"Klusowski, J.M., Barron, A.R.: Approximation by combinations of relu and squared relu ridge functions with $$l^{1}$$ and $$l^{0}$$ controls. IEEE Trans. Inf. Theory 64(12), 7649\u20137656 (2018)","journal-title":"IEEE Trans. Inf. Theory"},{"key":"10657_CR48","unstructured":"Khemakhem, I., Kingma, D., Monti, R., Hyvarinen, A.: Variational autoencoders and nonlinear ica: A unifying framework. In: International Conference on Artificial Intelligence and Statistics, pp. 2207\u20132217 (2020). PMLR"},{"key":"10657_CR49","unstructured":"Kingma, D.P., Welling, M.: Auto-encoding variational bayes. In: 2nd International Conference on Learning Representations (2014)"},{"key":"10657_CR50","unstructured":"LeCun, Y., Cortes, C., Burges\u00a0J.c., C.: MNIST handwritten digit database. https:\/\/yann.lecun.com\/exdb\/mnist\/"},{"key":"10657_CR51","unstructured":"Li, C.T., Farnia, F.: Mode-seeking divergences: Theory and applications to gans. In: Proceedings of The 26th International Conference on Artificial Intelligence and Statistics. Proceedings of Machine Learning Research, vol. 206, pp. 8321\u20138350. PMLR (2023)"},{"key":"10657_CR52","doi-asserted-by":"publisher","first-page":"3613","DOI":"10.1214\/19-EJS1617","volume":"13","author":"H Liu","year":"2019","unstructured":"Liu, H., Gao, C.: Density estimation with contamination: minimax rates and theory of adaptation. Electron. J. Stat. 13, 3613\u20133653 (2019)","journal-title":"Electron. J. Stat."},{"key":"10657_CR53","unstructured":"Lee, H., Ge, R., Ma, T., Risteski, A., Arora, S.: On the ability of neural nets to express distributions. In: Conference on Learning Theory, pp. 1271\u20131296 (2017). PMLR"},{"key":"10657_CR54","first-page":"9151","volume":"35","author":"T Liu","year":"2022","unstructured":"Liu, T., Kumar, P., Zhou, R., Liu, X.: Learning from few samples: Transformation-invariant svms with composition and locality at multiple scales. Adv. Neural. Inf. Process. Syst. 35, 9151\u20139163 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"issue":"1","key":"10657_CR55","doi-asserted-by":"publisher","first-page":"312","DOI":"10.1093\/imaiai\/iaac020","volume":"12","author":"Z Liu","year":"2022","unstructured":"Liu, Z., Loh, P.-L.: Robust W-GAN-based estimation under Wasserstein contamination. Information and Inference: A Journal of the IMA 12(1), 312\u2013362 (2022)","journal-title":"Information and Inference: A Journal of the IMA"},{"key":"10657_CR56","doi-asserted-by":"crossref","unstructured":"Larsen, K.G., Nelson, J.: Optimality of the johnson-lindenstrauss lemma. In: 58th Annual Symposium on Foundations of Computer Science (FOCS), pp. 633\u2013638 (2017). IEEE","DOI":"10.1109\/FOCS.2017.64"},{"key":"10657_CR57","unstructured":"Moriakov, N., Adler, J., Teuwen, J.: Kernel of cyclegan as a principal homogeneous space. In: International Conference on Learning Representations (2020)"},{"issue":"2","key":"10657_CR58","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1215\/S0012-7094-95-08013-2","volume":"80","author":"RJ McCann","year":"1995","unstructured":"McCann, R.J.: Existence and uniqueness of monotone measure-preserving maps. Duke Math. J. 80(2), 309\u2013323 (1995)","journal-title":"Duke Math. J."},{"issue":"1","key":"10657_CR59","doi-asserted-by":"publisher","first-page":"78","DOI":"10.1137\/18M1189336","volume":"1","author":"H Montanelli","year":"2019","unstructured":"Montanelli, H., Du, Q.: New error bounds for deep relu networks using sparse grids. SIAM Journal on Mathematics of Data Science 1(1), 78\u201392 (2019)","journal-title":"SIAM Journal on Mathematics of Data Science"},{"key":"10657_CR60","unstructured":"Modeste, T., Dombry, C.: Characterization of translation invariant mmd on r d and connections with wasserstein distances (2022)"},{"key":"10657_CR61","doi-asserted-by":"crossref","unstructured":"Mahabadi, S., Makarychev, K., Makarychev, Y., Razenshteyn, I.: Nonlinear dimension reduction via outer bi-lipschitz extensions. In: Proceedings of the 50th Annual ACM SIGACT Symposium on Theory of Computing, pp. 1088\u20131101 (2018)","DOI":"10.1145\/3188745.3188828"},{"issue":"3","key":"10657_CR62","doi-asserted-by":"publisher","first-page":"1475","DOI":"10.1007\/s00205-020-01569-5","volume":"238","author":"RJ McCann","year":"2020","unstructured":"McCann, R.J., Pass, B.: Optimal transportation between unequal dimensions. Arch. Ration. Mech. Anal. 238(3), 1475\u20131520 (2020)","journal-title":"Arch. Ration. Mech. Anal."},{"issue":"2","key":"10657_CR63","doi-asserted-by":"publisher","first-page":"429","DOI":"10.2307\/1428011","volume":"29","author":"A M\u00fcller","year":"1997","unstructured":"M\u00fcller, A.: Integral probability metrics and their generating classes of functions. Adv. Appl. Probab. 29(2), 429\u2013443 (1997)","journal-title":"Adv. Appl. Probab."},{"key":"10657_CR64","doi-asserted-by":"publisher","first-page":"177","DOI":"10.1007\/s10959-007-0058-1","volume":"20","author":"R Nickl","year":"2007","unstructured":"Nickl, R., P\u00f6tscher, B.M.: Bracketing metric entropy rates and empirical central limit theorems for function classes of besov-and sobolev-type. J. Theor. Probab. 20, 177\u2013199 (2007)","journal-title":"J. Theor. Probab."},{"key":"10657_CR65","doi-asserted-by":"crossref","unstructured":"Peacock, J.A.: Two-dimensional goodness-of-fit testing in astronomy. Monthly Notices of the Royal Astronomical Society 202(3) (1983)","DOI":"10.1093\/mnras\/202.3.615"},{"key":"10657_CR66","unstructured":"Puritz, C., Ness-Cohn, E., Braun, R.: fasano. franceschini. test: An implementation of a multidimensional ks test in r. arXiv preprint arXiv:2106.10539 (2021)"},{"key":"10657_CR67","doi-asserted-by":"publisher","first-page":"296","DOI":"10.1016\/j.neunet.2018.08.019","volume":"108","author":"P Petersen","year":"2018","unstructured":"Petersen, P., Voigtlaender, F.: Optimal approximation of piecewise smooth functions using deep relu neural networks. Neural Netw. 108, 296\u2013330 (2018)","journal-title":"Neural Netw."},{"key":"10657_CR68","unstructured":"Pope, P., Zhu, C., Abdelkader, A., Goldblum, M., Goldstein, T.: The intrinsic dimension of images and its impact on learning. In: International Conference on Learning Representations (2021)"},{"key":"10657_CR69","doi-asserted-by":"crossref","unstructured":"Rolinek, M., Zietlow, D., Martius, G.: Variational autoencoders pursue pca directions (by accident). In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12406\u201312415 (2019)","DOI":"10.1109\/CVPR.2019.01269"},{"key":"10657_CR70","unstructured":"Sriperumbudur, B.K., Fukumizu, K., Gretton, A., Sch\u00f6lkopf, B., Lanckriet, G.R.: On integral probability metrics, $$\\phi $$-divergences and binary classification. preprint arXiv:0901.2698 (2009)"},{"key":"10657_CR71","first-page":"1517","volume":"11","author":"BK Sriperumbudur","year":"2010","unstructured":"Sriperumbudur, B.K., Gretton, A., Fukumizu, K., Sch\u00f6lkopf, B., Lanckriet, G.R.: Hilbert space embeddings and metrics on probability measures. J. Mach. Learn. Res. 11, 1517\u20131561 (2010)","journal-title":"J. Mach. Learn. Res."},{"key":"10657_CR72","unstructured":"Suzuki, T.: Adaptivity of deep reLU network for learning in besov and mixed smooth besov spaces: optimal rate and curse of dimensionality. In: International Conference on Learning Representations (2019)"},{"key":"10657_CR73","unstructured":"Shen, Z., Yang, H., Zhang, S.: Deep network approximation characterized by number of neurons. arXiv preprint arXiv:1906.05497 (2019)"},{"key":"10657_CR74","unstructured":"Tanielian, U., Biau, G.: Approximating lipschitz continuous functions with groupsort neural networks. In: International Conference on Artificial Intelligence and Statistics, pp. 442\u2013450 (2021). PMLR"},{"key":"10657_CR75","unstructured":"Tolstikhin, I., Bousquet, O., Gelly, S., Schoelkopf, B.: Wasserstein auto-encoders. In: International Conference on Learning Representations (2018)"},{"key":"10657_CR76","doi-asserted-by":"crossref","unstructured":"Topsoe, F.: Some inequalities for information divergence and related measures of discrimination. IEEE Trans. Inf. Theory 46(4), 1602\u20131609 (2000)","DOI":"10.1109\/18.850703"},{"key":"10657_CR77","unstructured":"Vaart, A.W.: Asymptotic Statistics. Cambridge Series in Statistical and Probabilistic Mathematics. Cambridge University Press (2000)"},{"key":"10657_CR78","unstructured":"Vaart, A., Wellner, J.A.: Weak Convergence and Empirical Processes: With Applications to Statistics. Springer Series in Statistics. Springer (1996)"},{"key":"10657_CR79","doi-asserted-by":"crossref","unstructured":"Vladimirova, M., Girard, S., Nguyen, H., Arbel, J.: Sub-weibull distributions: Generalizing sub-gaussian and sub-exponential properties to heavier tailed distributions. Stat 9(1) (2020)","DOI":"10.1002\/sta4.318"},{"key":"10657_CR80","doi-asserted-by":"crossref","unstructured":"Van\u00a0Handel, R.: Probability in high dimension. Technical report, PRINCETON UNIV NJ (2014)","DOI":"10.21236\/ADA623999"},{"key":"10657_CR81","doi-asserted-by":"crossref","unstructured":"Villani, C.: Optimal Transport: Old and New vol. 338. Springer (2009)","DOI":"10.1007\/978-3-540-71050-9"},{"key":"10657_CR82","unstructured":"Virmaux, A., Scaman, K.: Lipschitz regularity of deep neural networks: analysis and efficient estimation. Advances in Neural Information Processing Systems 31 (2018)"},{"issue":"2","key":"10657_CR83","first-page":"1","volume":"61","author":"S Wojtowytsch","year":"2022","unstructured":"Wojtowytsch, S.: Representation formulas and pointwise properties for barron functions. Calc. Var. Partial. Differ. Equ. 61(2), 1\u201337 (2022)","journal-title":"Calc. Var. Partial. Differ. Equ."},{"key":"10657_CR84","unstructured":"Weed, J., Bach, F.R.: Sharp asymptotic and finite-sample rates of convergence of empirical measures in wasserstein distance. Bernoulli (2017)"},{"key":"10657_CR85","doi-asserted-by":"crossref","unstructured":"Wei, R., Garcia, C., El-Sayed, A., Peterson, V., Mahmood, A.: Variations in variational autoencoders - a comparative evaluation. IEEE Access 8 (2020)","DOI":"10.1109\/ACCESS.2020.3018151"},{"key":"10657_CR86","doi-asserted-by":"publisher","first-page":"103","DOI":"10.1016\/j.neunet.2017.07.002","volume":"94","author":"D Yarotsky","year":"2017","unstructured":"Yarotsky, D.: Error bounds for approximations with deep relu networks. Neural Netw. 94, 103\u2013114 (2017)","journal-title":"Neural Netw."},{"key":"10657_CR87","unstructured":"Yarotsky, D.: Optimal approximation of continuous functions by very deep relu networks. In: Conference on Learning Theory, pp. 639\u2013649 (2018). PMLR"},{"key":"10657_CR88","doi-asserted-by":"crossref","unstructured":"Yang, Y., Li, Z., Wang, Y.: On the capacity of deep generative networks for approximating distributions. Neural networks 145 (2022)","DOI":"10.1016\/j.neunet.2021.10.012"},{"issue":"4","key":"10657_CR89","doi-asserted-by":"publisher","first-page":"2256","DOI":"10.1214\/22-AOS2186","volume":"50","author":"B Zhu","year":"2022","unstructured":"Zhu, B., Jiao, J., Steinhardt, J.: Generalized resilience and robust statistics. Ann. Stat. 50(4), 2256\u20132283 (2022)","journal-title":"Ann. Stat."}],"container-title":["Statistics and Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11222-025-10657-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11222-025-10657-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11222-025-10657-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,6]],"date-time":"2025-09-06T18:13:11Z","timestamp":1757182391000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11222-025-10657-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,6]]},"references-count":89,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2025,10]]}},"alternative-id":["10657"],"URL":"https:\/\/doi.org\/10.1007\/s11222-025-10657-z","relation":{},"ISSN":["0960-3174","1573-1375"],"issn-type":[{"type":"print","value":"0960-3174"},{"type":"electronic","value":"1573-1375"}],"subject":[],"published":{"date-parts":[[2025,6,6]]},"assertion":[{"value":"18 August 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 May 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 June 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"All codes, along with implementation details, can be found in the following repository .","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Code availability"}}],"article-number":"114"}}