{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,11]],"date-time":"2026-01-11T01:20:07Z","timestamp":1768094407377,"version":"3.49.0"},"reference-count":49,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/100000183","name":"Army Research Office","doi-asserted-by":"publisher","award":["W911NF-18-1-0345"],"award-info":[{"award-number":["W911NF-18-1-0345"]}],"id":[{"id":"10.13039\/100000183","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Mach Learn"],"published-print":{"date-parts":[[2025,11]]},"DOI":"10.1007\/s10994-025-06908-9","type":"journal-article","created":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T16:31:15Z","timestamp":1760891475000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Squared Wasserstein-2 loss functions for efficient learning of stochastic differential equations"],"prefix":"10.1007","volume":"114","author":[{"given":"Mingtao","family":"Xia","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiangting","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qijing","family":"Shen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tom","family":"Chou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,10,19]]},"reference":[{"key":"6908_CR1","unstructured":"Arjovsky, M., Chintala, S., & Bottou, L. (2017). Wasserstein generative adversarial networks. In: International conference on machine learning, pp. 214\u2013223. PMLR"},{"key":"6908_CR2","unstructured":"Bartl, D., Beiglb\u00f6ck, M., & Pammer, G. (2021). The Wasserstein space of stochastic processes. arXiv preprint arXiv:2104.14245"},{"issue":"3","key":"6908_CR3","doi-asserted-by":"publisher","first-page":"1609","DOI":"10.1214\/18-aap1423","volume":"29","author":"J Bion-Nadal","year":"2019","unstructured":"Bion-Nadal, J., & Talay, D. (2019). On a Wasserstein-type distance between solutions to stochastic differential equations. The Annals of Applied Probability, 29(3), 1609\u20131639. https:\/\/doi.org\/10.1214\/18-aap1423","journal-title":"The Annals of Applied Probability"},{"key":"6908_CR4","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-319-08488-6","volume-title":"Stochastic processes in cell biology","author":"PC Bressloff","year":"2014","unstructured":"Bressloff, P. C. (2014). Stochastic Processes in Cell Biology (Vol. 41). Springer."},{"key":"6908_CR5","unstructured":"Briol, F.-X., Barp, A., Duncan, A.B., & Girolami, M. (2019). Statistical inference for generative models with maximum mean discrepancy. arXiv preprint arXiv:1906.05944"},{"key":"6908_CR6","unstructured":"Chen, R.T., Rubanova, Y., Bettencourt, J., & Duvenaud, D.K. (2018). Neural ordinary differential equations. In: Advances in neural information processing systems, vol. 31"},{"key":"6908_CR7","unstructured":"Chewi, S., Clancy, J., Le\u00a0Gouic, T., Rigollet, P., Stepaniants, G., & Stromme, A. (2021). Fast and smooth interpolation on Wasserstein space. In: International conference on artificial intelligence and statistics, pp. 3061\u20133069. PMLR"},{"key":"6908_CR8","unstructured":"Choulli, T., & Schweizer, M. (2024). New stochastic F ubini theorems. arXiv preprint https:\/\/arxiv.org\/abs\/2403.13791"},{"key":"6908_CR9","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-87859-1","volume-title":"Probability and stochastics","author":"E Cinlar","year":"2011","unstructured":"Cinlar, E. (2011). Probability and Stochastics. Springer."},{"issue":"1","key":"6908_CR10","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1090\/S0002-9939-07-09020-X","volume":"136","author":"P Clement","year":"2008","unstructured":"Clement, P., & Desch, W. (2008). An elementary proof of the triangle inequality for the Wasserstein metric. Proceedings of the American Mathematical Society, 136(1), 333\u2013339.","journal-title":"Proceedings of the American Mathematical Society"},{"key":"6908_CR11","unstructured":"Cuturi, M., Teboul, O., & Vert, J.-P. (2019). Differentiable ranks and sorting using optimal transport. In: Proceedings of the 33rd international conference on neural information processing systems, pp. 6861\u20136871"},{"issue":"1","key":"6908_CR12","first-page":"3571","volume":"22","author":"R Flamary","year":"2021","unstructured":"Flamary, R., Courty, N., Gramfort, A., Alaya, M. Z., Boisbunon, A., Chambon, S., Chapel, L., Corenflos, A., Fatras, K., Fournier, N., et al. (2021). Pot: python optimal transport. The Journal of Machine Learning Research, 22(1), 3571\u20133578.","journal-title":"The Journal of Machine Learning Research"},{"issue":"3\u20134","key":"6908_CR13","doi-asserted-by":"publisher","first-page":"707","DOI":"10.1007\/s00440-014-0583-7","volume":"162","author":"N Fournier","year":"2015","unstructured":"Fournier, N., & Guillin, A. (2015). On the rate of convergence in Wasserstein distance of the empirical measure. Probability Theory and Related Fields, 162(3\u20134), 707\u2013738.","journal-title":"Probability Theory and Related Fields"},{"key":"6908_CR14","unstructured":"Frogner, C., Zhang, C., Mobahi, H., Araya, M., & Poggio, T.A. (2015). Learning with a Wasserstein loss. In: Advances in neural information processing systems, vol. 28"},{"issue":"1362","key":"6908_CR15","doi-asserted-by":"publisher","first-page":"319","DOI":"10.1098\/rspb.1995.0153","volume":"261","author":"A Goldbeter","year":"1995","unstructured":"Goldbeter, A. (1995). A model for circadian oscillations in the Drosophila period protein (PER). Proceedings of the Royal Society of London Series B: Biological Sciences, 261(1362), 319\u2013324.","journal-title":"Proceedings of the Royal Society of London Series B: Biological Sciences"},{"key":"6908_CR16","first-page":"699","volume":"6","author":"D Gonze","year":"2011","unstructured":"Gonze, D. (2011). Modeling circadian clocks: From equations to oscillations. Central European Journal of Biology, 6, 699\u2013711.","journal-title":"Central European Journal of Biology"},{"issue":"6","key":"6908_CR17","doi-asserted-by":"publisher","first-page":"507","DOI":"10.1002\/asmb.709","volume":"24","author":"H Gzyl","year":"2008","unstructured":"Gzyl, H., Horst, E., & Malone, S. W. (2008). Bayesian parameter inference for models of the black and Scholes type. Applied Stochastic Models in Business and Industry, 24(6), 507\u2013524.","journal-title":"Applied Stochastic Models in Business and Industry"},{"key":"6908_CR18","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2016). Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"6908_CR19","volume-title":"Calcul stochastique et problemes de martingales","author":"J Jacod","year":"2006","unstructured":"Jacod, J. (2006). Calcul stochastique et problemes de martingales (Vol. 714). Springer."},{"key":"6908_CR20","unstructured":"Jia, J., & Benson, A.R. (2019). Neural jump stochastic differential equations. In: Advances in neural information processing systems32"},{"key":"6908_CR21","unstructured":"Kidger, P., Foster, J., Li, X., & Lyons, T.J. (2021). Neural SDEs as infinite-dimensional GANs. In: International conference on machine learning, pp. 5453\u20135463. PMLR"},{"key":"6908_CR22","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-662-12616-5","volume-title":"Numerical solution of stochastic differential equations","author":"PE Kloeden","year":"1992","unstructured":"Kloeden, P. E., & Platen, E. (1992). Numerical solution of stochastic differential equations. Springer."},{"key":"6908_CR23","unstructured":"Kolouri, S., Nadjahi, K., Simsekli, U., Badeau, R., & Rohde, G. (2019). Generalized sliced Wasserstein distances. In: Advances in neural information processing systems, vol. 32"},{"key":"6908_CR24","doi-asserted-by":"crossref","unstructured":"Kolouri, S., Rohde, G.K., & Hoffmann, H. (2018). Sliced Wasserstein distance for learning Gaussian mixture models. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 3427\u20133436","DOI":"10.1109\/CVPR.2018.00361"},{"key":"6908_CR25","unstructured":"Li, Y., Swersky, K., & Zemel, R. (2015). Generative moment matching networks. In: International conference on machine learning, pp. 1718\u20131727. PMLR"},{"key":"6908_CR26","unstructured":"Li, X., Wong, T.-K.L., Chen, R.T., & Duvenaud, D. (2020). Scalable gradients for stochastic differential equations. In: International conference on artificial intelligence and statistics, pp. 3870\u20133882. PMLR"},{"issue":"138","key":"6908_CR27","doi-asserted-by":"publisher","first-page":"20170804","DOI":"10.1098\/rsif.2017.0804","volume":"15","author":"YT Lin","year":"2018","unstructured":"Lin, Y. T., & Buchler, N. E. (2018). Efficient analysis of stochastic gene dynamics in the non-adiabatic regime using piecewise deterministic Markov processes. Journal of The Royal Society Interface, 15(138), 20170804.","journal-title":"Journal of The Royal Society Interface"},{"issue":"11","key":"6908_CR28","doi-asserted-by":"publisher","first-page":"4405","DOI":"10.1109\/TNNLS.2019.2957109","volume":"31","author":"H Liu","year":"2020","unstructured":"Liu, H., Ong, Y.-S., Shen, X., & Cai, J. (2020). When Gaussian process meets big data: a review of scalable GPs . IEEE Transactions on Neural Networks and Learning Systems, 31(11), 4405\u20134423.","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"6908_CR29","first-page":"133","volume":"168","author":"DJ MacKay","year":"1998","unstructured":"MacKay, D. J., et al. (1998). Introduction to Gaussian processes. NATO ASI Series F Computer and Systems Sciences, 168, 133\u2013166.","journal-title":"NATO ASI Series F Computer and Systems Sciences"},{"key":"6908_CR30","doi-asserted-by":"publisher","first-page":"209","DOI":"10.1007\/s11075-004-2866-z","volume":"38","author":"L Mathelin","year":"2005","unstructured":"Mathelin, L., Hussaini, M. Y., & Zang, T. A. (2005). Stochastic approaches to uncertainty quantification in cfd simulations. Numerical Algorithms, 38, 209\u2013236.","journal-title":"Numerical Algorithms"},{"key":"6908_CR31","doi-asserted-by":"crossref","unstructured":"Musiela, M., & Rutkowski, M. (2006). Martingale methods in financial modelling vol. 36. Springer","DOI":"10.1007\/b137866"},{"key":"6908_CR32","unstructured":"Oh, J.H., Pouryahya, M., Iyer, A., Apte, A.P., Tannenbaum, A., & Deasy, J.O. (2019). Kernel Wasserstein distance. arXiv preprint arXiv:1905.09314"},{"key":"6908_CR33","unstructured":"Pereira, J., Ibrahimi, M., & Montanari, A. (2010). Learning networks of stochastic differential equations. In: Advances in neural information processing systems, vol. 23"},{"key":"6908_CR34","unstructured":"Rowland, M., Hron, J., Tang, Y., Choromanski, K., Sarlos, T., & Weller, A. (2019). Orthogonal estimation of Wasserstein distances. In: The 22nd International conference on artificial intelligence and statistics, pp. 186\u2013195. PMLR"},{"issue":"1","key":"6908_CR35","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1007\/BF00532240","volume":"70","author":"L R\u00fcschendorf","year":"1985","unstructured":"R\u00fcschendorf, L. (1985). The Wasserstein distance and approximation theorems. Probability Theory and Related Fields, 70(1), 117\u2013129.","journal-title":"Probability Theory and Related Fields"},{"issue":"1","key":"6908_CR36","first-page":"11006","volume":"22","author":"JM Sanz-Serna","year":"2021","unstructured":"Sanz-Serna, J. M., & Zygalakis, K. C. (2021). Wasserstein distance estimates for the distributions of numerical approximations to ergodic stochastic differential equations. The Journal of Machine Learning Research, 22(1), 11006\u201311042.","journal-title":"The Journal of Machine Learning Research"},{"key":"6908_CR37","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-54339-0","volume-title":"Uncertainty quantification","author":"C Soize","year":"2017","unstructured":"Soize, C. (2017). Uncertainty quantification. Springer."},{"key":"6908_CR38","unstructured":"Song, Y., Sohl-Dickstein, J., Kingma, D.P., Kumar, A., Ermon, S., & Poole, B. (2020). Score-based generative modeling through stochastic differential equations. In: International conference on learning representations"},{"key":"6908_CR39","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-319-23395-6","volume-title":"Introduction to uncertainty quantification","author":"TJ Sullivan","year":"2015","unstructured":"Sullivan, T. J. (2015). Introduction to uncertainty quantification (Vol. 63). Springer."},{"key":"6908_CR40","first-page":"37660","volume":"35","author":"A Tong","year":"2022","unstructured":"Tong, A., Nguyen-Tang, T., Tran, T., & Choi, J. (2022). Learning fractional white noises in neural stochastic differential equations. Advances in Neural Information Processing Systems, 35, 37660\u201337675.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"6908_CR41","unstructured":"Tzen, B., & Raginsky, M. (2019). Neural stochastic differential equations: deep latent Gaussian models in the diffusion limit. arXiv preprint arXiv:1905.09883"},{"issue":"12","key":"6908_CR42","doi-asserted-by":"publisher","DOI":"10.1063\/1.4973197","volume":"57","author":"FC Vecchi","year":"2016","unstructured":"Vecchi, F. C., Morando, P., & Ugolini, S. (2016). Reduction and reconstruction of stochastic differential equations via symmetries. Journal of Mathematical Physics, 57(12), Article 123508.","journal-title":"Journal of Mathematical Physics"},{"key":"6908_CR43","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-540-71050-9","volume-title":"Optimal transport: Old and new","author":"C Villani","year":"2009","unstructured":"Villani, C., et al. (2009). Optimal transport: Old and new (Vol. 338). Springer."},{"key":"6908_CR44","doi-asserted-by":"crossref","unstructured":"Wang, J. (2016). $${L}^{p}$$-Wasserstein distance for stochastic differential equations driven by L\u00e9vy processes. Bernoulli, pp. 1598\u20131616","DOI":"10.3150\/15-BEJ705"},{"key":"6908_CR45","doi-asserted-by":"crossref","unstructured":"Welch, G.F. (2020). Kalman filter. Computer vision: A reference guide, pp. 1\u20133","DOI":"10.1007\/978-3-030-03243-2_716-1"},{"key":"6908_CR46","unstructured":"Welch, G., Bishop, G., et al. (1995). An introduction to the Kalman filter"},{"issue":"11","key":"6908_CR47","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1371\/journal.pcbi.1000580","volume":"5","author":"PO Westermark","year":"2009","unstructured":"Westermark, P. O., Welsh, D. K., Okamura, H., & Herzel, H. (2009). Quantification of circadian rhythms in single cells. PLOS Computational Biology, 5(11), 1\u201310. https:\/\/doi.org\/10.1371\/journal.pcbi.1000580","journal-title":"PLOS Computational Biology"},{"key":"6908_CR48","doi-asserted-by":"crossref","unstructured":"Xia, M., Li, X., Shen, Q., & Chou, T. (2024). An efficient Wasserstein-distance approach for reconstructing jump-diffusion processes using parameterized neural networks. Machine Learning: Science and Technology, 5(4), pp. 045052.","DOI":"10.1088\/2632-2153\/ad9379"},{"key":"6908_CR49","doi-asserted-by":"crossref","unstructured":"Zheng, W., Wang, F.-Y., & Gou, C. (2020). Nonparametric different-feature selection using Wasserstein distance. In: 2020 IEEE 32nd international conference on tools with artificial intelligence (ICTAI), pp. 982\u2013988. IEEE","DOI":"10.1109\/ICTAI50040.2020.00153"}],"container-title":["Machine Learning"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-025-06908-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10994-025-06908-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-025-06908-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,2]],"date-time":"2025-12-02T14:29:33Z","timestamp":1764685773000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10994-025-06908-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,19]]},"references-count":49,"journal-issue":{"issue":"11","published-print":{"date-parts":[[2025,11]]}},"alternative-id":["6908"],"URL":"https:\/\/doi.org\/10.1007\/s10994-025-06908-9","relation":{},"ISSN":["0885-6125","1573-0565"],"issn-type":[{"value":"0885-6125","type":"print"},{"value":"1573-0565","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,10,19]]},"assertion":[{"value":"3 July 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 July 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 September 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 October 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"No competing and financial interests to disclose.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}},{"value":"Not applicable.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent to participate"}},{"value":"Not applicable.","order":5,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}}],"article-number":"255"}}