{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,3]],"date-time":"2026-06-03T03:21:38Z","timestamp":1780456898476,"version":"3.54.1"},"reference-count":67,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2022,7,9]],"date-time":"2022-07-09T00:00:00Z","timestamp":1657324800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,7,9]],"date-time":"2022-07-09T00:00:00Z","timestamp":1657324800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["DMS-2015498"],"award-info":[{"award-number":["DMS-2015498"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R01-GM126089"],"award-info":[{"award-number":["R01-GM126089"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["DMS-2053746"],"award-info":[{"award-number":["DMS-2053746"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000015","name":"U.S. Department of Energy","doi-asserted-by":"publisher","award":["DE-SC0021142"],"award-info":[{"award-number":["DE-SC0021142"]}],"id":[{"id":"10.13039\/100000015","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100006231","name":"Brookhaven National Laboratory","doi-asserted-by":"publisher","award":["subcontract 382247"],"award-info":[{"award-number":["subcontract 382247"]}],"id":[{"id":"10.13039\/100006231","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R01-GM117597"],"award-info":[{"award-number":["R01-GM117597"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Stat Comput"],"published-print":{"date-parts":[[2022,8]]},"DOI":"10.1007\/s11222-022-10120-3","type":"journal-article","created":{"date-parts":[[2022,7,9]],"date-time":"2022-07-09T09:02:27Z","timestamp":1657357347000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["An adaptively weighted stochastic gradient MCMC algorithm for Monte Carlo simulation and global optimization"],"prefix":"10.1007","volume":"32","author":[{"given":"Wei","family":"Deng","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Guang","family":"Lin","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1177-5501","authenticated-orcid":false,"given":"Faming","family":"Liang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2022,7,9]]},"reference":[{"key":"10120_CR1","unstructured":"Ahn, S., Balan, A.K., Welling, M.: Bayesian posterior sampling via stochastic gradient fisher scoring. In: International Conference on Machine Learning (ICML) (2012a)"},{"key":"10120_CR2","unstructured":"Ahn, S., Korattikara, A., Welling, M.: Bayesian posterior sampling via stochastic gradient fisher scoring. In: International Conference on Machine Learning (ICML) (2012b)"},{"key":"10120_CR3","unstructured":"Aitchison, L.: A statistical theory of cold posteriors in deep neural networks. In: International Conference on Learning Representation (ICLR) (2021)"},{"key":"10120_CR4","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1137\/S0363012902417267","volume":"44","author":"C Andrieu","year":"2005","unstructured":"Andrieu, C., Moulines, E., Priouret, P.: Stability of stochastic approximation under verifiable conditions. SIAM J. Control Optim. 44, 283\u2013312 (2005)","journal-title":"SIAM J. Control Optim."},{"key":"10120_CR5","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1017\/S0962492921000039","volume":"30","author":"M Belkin","year":"2021","unstructured":"Belkin, M.: Fit without fear: remarkable mathematical phenomena of deep learning through the prism of interpolation. Acta Numer. 30, 203\u2013248 (2021)","journal-title":"Acta Numer."},{"key":"10120_CR6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-75894-2","volume-title":"Adaptive Algorithms and Stochastic Approximations","author":"A Benveniste","year":"1990","unstructured":"Benveniste, A., M\u00e9tivier, M., Priouret, P.: Adaptive Algorithms and Stochastic Approximations. Springer, Berlin (1990)"},{"key":"10120_CR7","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1016\/0370-2693(91)91256-U","volume":"267","author":"BA Berg","year":"1991","unstructured":"Berg, B.A., Neuhaus, T.: Multicanonical algorithms for first order phase transitions. Phys. Lett. B 267, 249\u2013253 (1991)","journal-title":"Phys. Lett. B"},{"key":"10120_CR8","unstructured":"Chen, C., Carlson, D., Gan, Z., Li, C., Carin, L.: Bridging the gap between stochastic gradient MCMC and stochastic optimization. In: International Conference on Artificial Intelligence and Statistics, AISTATS 2016 (2016)"},{"key":"10120_CR9","unstructured":"Chen, C., Ding, N., Carin, L.: On the convergence of stochastic gradient MCMC algorithms with high-order integrators. In: Advances in Neural Information Processing Systems (NIPS) (2015)"},{"key":"10120_CR10","unstructured":"Chen, T., Fox, E.B., Guestrin, C.: Stochastic gradient Hamiltonian Monte Carlo. In: International Conference on Machine Learning (ICML) (2014)"},{"key":"10120_CR11","unstructured":"Chen, Y., Chen, J., Dong, J., Peng, J., Wang, Z.: Accelerating nonconvex learning via replica exchange Langevin diffusion. In: International Conference on Learning Representation (ICLR) (2019)"},{"key":"10120_CR12","unstructured":"Deng, W., Feng, Q., Gao, L., Liang, F., Lin, G.: Non-convex learning via replica exchange stochastic gradient MCMC. In: International Conference on Machine Learning (ICML) (2020a)"},{"key":"10120_CR13","unstructured":"Deng, W., Feng, Q., Karagiannis, G., Lin, G., Liang, F.: Accelerating convergence of replica exchange stochastic gradient MCMC via variance reduction. In: International Conference on Learning Representation (ICLR) (2021)"},{"key":"10120_CR14","unstructured":"Deng, W., Lin, G., Liang, F.: A contour stochastic gradient langevin dynamics algorithm for simulations of multi-modal distributions. In: Advances in Neural Information Processing Systems (NeurIPS) (2020b)"},{"key":"10120_CR15","unstructured":"Ding, N., Fang, Y., Babbush, R., Chen, C., Skeel, R.D., Neven, H.: Bayesian sampling using stochastic gradient thermostats. In: Advances in Neural Information Processing Systems (NeurIPS) (2014)"},{"key":"10120_CR16","unstructured":"Erdogdu, M.A., Mackey, L., Shamir, O.: Global non-convex optimization with discretized diffusions. In: Advances in Neural Information Processing Systems (NeurIPS) (2018)"},{"key":"10120_CR17","doi-asserted-by":"publisher","first-page":"2297","DOI":"10.1090\/S0025-5718-2015-02952-4","volume":"84","author":"G Fort","year":"2015","unstructured":"Fort, G., Jourdain, B., Kuhn, E., Leli\u00e8vre, T., Stoltz, G.: Convergence of the Wang\u2013Landau algorithm. Math. Comput. 84, 2297\u20132327 (2015)","journal-title":"Math. Comput."},{"key":"10120_CR18","unstructured":"Geyer, C.J.: Markov chain Monte Carlo maximum likelihood. In: Computing Science and Statistics: Proceedings of the 23rd Symposium on the Interface, pp. 156\u2013163 (1991)"},{"key":"10120_CR19","doi-asserted-by":"publisher","first-page":"909","DOI":"10.1080\/01621459.1995.10476590","volume":"90","author":"CJ Geyer","year":"1995","unstructured":"Geyer, C.J., Thompson, E.A.: Annealing Markov Chain Monte Carlo with applications to ancestral inference. J. Am. Stat. Assoc. 90, 909\u2013920 (1995)","journal-title":"J. Am. Stat. Assoc."},{"key":"10120_CR20","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1111\/j.1467-9868.2010.00765.x","volume":"73","author":"M Girolami","year":"2011","unstructured":"Girolami, M., Calderhead, B.: Riemann manifold Langevin and Hamiltonian Monte Carlo methods (with discussion). J. R. Stat. Soc. B 73, 123\u2013214 (2011)","journal-title":"J. R. Stat. Soc. B"},{"key":"10120_CR21","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1093\/biomet\/57.1.97","volume":"57","author":"W Hastings","year":"1970","unstructured":"Hastings, W.: Monte Carlo sampling methods using Markov Chain and their applications. Biometrika 57, 97\u2013109 (1970)","journal-title":"Biometrika"},{"key":"10120_CR22","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2016)","DOI":"10.1109\/CVPR.2016.90"},{"issue":"12","key":"10120_CR23","doi-asserted-by":"publisher","first-page":"2151","DOI":"10.1103\/PhysRevLett.74.2151","volume":"74","author":"B Hesselbo","year":"1995","unstructured":"Hesselbo, B., Stinchcombe, R.: Monte Carlo simulation and global optimization without parameters. Phys. Rev. Lett. 74(12), 2151\u20132155 (1995)","journal-title":"Phys. Rev. Lett."},{"key":"10120_CR24","doi-asserted-by":"crossref","unstructured":"Jarrett, K., Kavukcuoglu, K., Ranzato, M., LeCun, Y.: What is the best multi-stage architecture for object recognition? In: International Conference on Computer Vision (ICCV) (2009)","DOI":"10.1109\/ICCV.2009.5459469"},{"key":"10120_CR25","doi-asserted-by":"publisher","first-page":"671","DOI":"10.1126\/science.220.4598.671","volume":"220","author":"S Kirkpatrick","year":"1983","unstructured":"Kirkpatrick, S., Gelatt, C.D., Jr., Vecchi, M.P.: Optimization by simulated annealing. Science 220, 671\u2013680 (1983)","journal-title":"Science"},{"key":"10120_CR26","doi-asserted-by":"publisher","first-page":"235","DOI":"10.1007\/s10898-004-1936-z","volume":"33","author":"M Laguna","year":"2005","unstructured":"Laguna, M., Mart\u00ed, R.: Experimental testing of advanced scatter search designs for global optimization of multimodal functions. J. Glob. Optim. 33, 235\u2013255 (2005)","journal-title":"J. Glob. Optim."},{"key":"10120_CR27","doi-asserted-by":"publisher","first-page":"2278","DOI":"10.1109\/5.726791","volume":"86","author":"Y LeCun","year":"1998","unstructured":"LeCun, Y., Bottou, L., Bengio, Y., Haffner, P.: Gradient-based learning applied to document recognition. Proc. IEEE 86, 2278\u20132324 (1998)","journal-title":"Proc. IEEE"},{"key":"10120_CR28","doi-asserted-by":"crossref","unstructured":"Li, C., Chen, C., Carlson, D.E., Carin, L.: Preconditioned stochastic gradient Langevin dynamics for deep neural networks. In: AAAI Conference on Artificial Intelligence (AAAI) (2016)","DOI":"10.1609\/aaai.v30i1.10200"},{"key":"10120_CR29","doi-asserted-by":"publisher","first-page":"66701","DOI":"10.1103\/PhysRevE.69.066701","volume":"69","author":"F Liang","year":"2004","unstructured":"Liang, F.: Generalized 1\/k-ensemble algorithm. Phys. Rev. E 69, 66701\u201366707 (2004)","journal-title":"Phys. Rev. E"},{"key":"10120_CR30","doi-asserted-by":"publisher","first-page":"1311","DOI":"10.1198\/016214505000000259","volume":"100","author":"F Liang","year":"2005","unstructured":"Liang, F.: A generalized Wang\u2013Landau algorithm for Monte Carlo computation. J. Am. Stat. Assoc. 100, 1311\u20131327 (2005)","journal-title":"J. Am. Stat. Assoc."},{"key":"10120_CR31","doi-asserted-by":"publisher","first-page":"608","DOI":"10.1198\/106186007X238459","volume":"16","author":"F Liang","year":"2007","unstructured":"Liang, F.: Continuous contour Monte Carlo for marginal density estimation with an application to a spatial statistical model. J. Comput. Graph. Stat. 16, 608\u2013632 (2007)","journal-title":"J. Comput. Graph. Stat."},{"key":"10120_CR32","doi-asserted-by":"publisher","first-page":"581","DOI":"10.1016\/j.spl.2008.10.007","volume":"79","author":"F Liang","year":"2009","unstructured":"Liang, F.: On the use of stochastic approximation Monte Carlo for Monte Carlo integration. Stat. Probab. Lett. 79, 581\u2013587 (2009)","journal-title":"Stat. Probab. Lett."},{"key":"10120_CR33","doi-asserted-by":"publisher","first-page":"305","DOI":"10.1198\/016214506000001202","volume":"102","author":"F Liang","year":"2007","unstructured":"Liang, F., Liu, C., Carroll, R.J.: Stochastic approximation in Monte Carlo computation. J. Am. Stat. Assoc. 102, 305\u2013320 (2007)","journal-title":"J. Am. Stat. Assoc."},{"key":"10120_CR34","doi-asserted-by":"crossref","unstructured":"Liu, C., Zhu, L., Belkin, M.: Loss landscapes and optimization in over-parameterized non-linear systems and neural networks (2021). arXiv:2003.00307v2","DOI":"10.1016\/j.acha.2021.12.009"},{"key":"10120_CR35","unstructured":"Lu, X., Perrone, V., Hasenclever, L., Teh, Y.W., Vollmer, S.: Relativistic Monte Carlo. In: the 20th International Conference on Artificial Intelligence and Statistics (2017)"},{"key":"10120_CR36","unstructured":"Ma, Y.-A., Chen, T., Fox, E.B.: A complete recipe for stochastic gradient MCMC. In: Advances in Neural Information Processing Systems (NeurIPS) (2015)"},{"key":"10120_CR37","unstructured":"Maddox, W., Garipov, T., Izmailov, P., Vetrov, D., Wilson, A.G. A simple baseline for Bayesian uncertainty in deep learning. In: Advances in Neural Information Processing Systems (NeurIPS) (2019)"},{"key":"10120_CR38","unstructured":"Mangoubi, O., Vishnoi, N.K.: Convex optimization with unbounded nonconvex oracles using simulated annealing. In: Conference on Learning Theory (COLT) (2018)"},{"key":"10120_CR39","doi-asserted-by":"publisher","first-page":"451","DOI":"10.1209\/0295-5075\/19\/6\/002","volume":"19","author":"E Marinari","year":"1992","unstructured":"Marinari, E., Parisi, G.: Simulated tempering: a new Monte Carlo scheme. Europhys. Lett. 19, 451\u2013458 (1992)","journal-title":"Europhys. Lett."},{"key":"10120_CR40","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1016\/S0304-4149(02)00150-3","volume":"101","author":"J Mattingly","year":"2002","unstructured":"Mattingly, J., Stuartb, A., Highamc, D.: Ergodicity for SDEs and approximations: locally Lipschitz vector fields and degenerate noise. Stoch. Process. Appl. 101, 185\u2013232 (2002)","journal-title":"Stoch. Process. Appl."},{"key":"10120_CR41","doi-asserted-by":"publisher","first-page":"552","DOI":"10.1137\/090770527","volume":"48","author":"JC Mattingly","year":"2010","unstructured":"Mattingly, J.C., Stuart, A.M., Tretyakov, M.: Convergence of numerical time-averaging and stationary measures via Poisson equations. SIAM J. Numer. Anal. 48, 552\u2013577 (2010)","journal-title":"SIAM J. Numer. Anal."},{"key":"10120_CR42","doi-asserted-by":"publisher","first-page":"1087","DOI":"10.1063\/1.1699114","volume":"21","author":"N Metropolis","year":"1953","unstructured":"Metropolis, N., Rosenbluth, A., Rosenbluth, M., Teller, A., Teller, E.: Equation of state calculations by fast computing machines. J. Chem. Phys. 21, 1087\u20131091 (1953)","journal-title":"J. Chem. Phys."},{"key":"10120_CR43","first-page":"113","volume-title":"MCMC Using Hamiltonian Dynamics. Handbook of Markov Chain Monte Carlo","author":"RM Neal","year":"2012","unstructured":"Neal, R.M.: MCMC Using Hamiltonian Dynamics. Handbook of Markov Chain Monte Carlo, vol. 54, pp. 113\u2013162. Chapman & Hall\/CRC, London (2012)"},{"key":"10120_CR44","doi-asserted-by":"publisher","first-page":"433","DOI":"10.1080\/01621459.2020.1847120","volume":"116","author":"C Nemeth","year":"2021","unstructured":"Nemeth, C., Fearnhead, P.: Stochastic gradient Markov Chain Monte Carlo. J. Am. Stat. Assoc. 116, 433\u2013450 (2021)","journal-title":"J. Am. Stat. Assoc."},{"key":"10120_CR45","unstructured":"Patterson, S., Teh, Y.W.: Stochastic gradient Riemannian Langevin dynamics on the probability simplex. In: Proceedings of the 26th International Conference on Neural Information Processing Systems, vol. 2, pp. 3102\u20133110. NIPS\u201913. Curran Associates Inc, Red Hook (2013)"},{"key":"10120_CR46","unstructured":"PyTorch. CyclicLR in PyTorch (2019). https:\/\/pytorch.org\/docs\/stable\/generated\/torch.optim.lr_scheduler.CyclicLR.html"},{"key":"10120_CR47","first-page":"1","volume":"65","author":"M Raginsky","year":"2017","unstructured":"Raginsky, M., Rakhlin, A., Telgarsky, M.: Non-convex learning via stochastic gradient Langevin dynamics: a nonasymptotic analysis. Proc. Mach. Learn. Res. 65, 1\u201330 (2017)","journal-title":"Proc. Mach. Learn. Res."},{"key":"10120_CR48","doi-asserted-by":"publisher","first-page":"400","DOI":"10.1214\/aoms\/1177729586","volume":"22","author":"H Robbins","year":"1951","unstructured":"Robbins, H., Monro, S.: A stochastic approximation method. Ann. Math. Stat. 22, 400\u2013407 (1951)","journal-title":"Ann. Math. Stat."},{"key":"10120_CR49","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4757-4145-2","volume-title":"Monte Carlo Statistical Methods","author":"C Robert","year":"2004","unstructured":"Robert, C., Casella, G.: Monte Carlo Statistical Methods. Springer, Berlin (2004)"},{"key":"10120_CR50","doi-asserted-by":"publisher","first-page":"341","DOI":"10.2307\/3318418","volume":"2","author":"GO Roberts","year":"1996","unstructured":"Roberts, G.O., Tweedie, R.L.: Exponential convergence of Langevin distributions and their discrete approximations. Bernoulli 2, 341\u2013363 (1996)","journal-title":"Bernoulli"},{"key":"10120_CR51","unstructured":"Saatci, Y., Wilson, A.G.: Bayesian GAN. In: Advances in Neural Information Processing Systems (NIPS), pp. 3622\u20133631 (2017)"},{"key":"10120_CR52","unstructured":"Sato, I., Nakagawa, H.: Approximation analysis of stochastic gradient Langevin dynamics by using Fokker\u2013Planck equation and ito process. In: International Conference on Machine Learning (ICML) (2014)"},{"key":"10120_CR53","unstructured":"Simsekli, U., Badeau, R., Cemgil, T., Richard, G.: Stochastic quasi-Newton Langevin Monte Carlo. In: International Conference on Machine Learning, vol. 48 (2016)"},{"key":"10120_CR54","doi-asserted-by":"crossref","unstructured":"Smith, L.N.: Cyclical learning rates for training neural networks. In: 2017 Winter Conference on Applications of Computer Vision (2017)","DOI":"10.1109\/WACV.2017.58"},{"key":"10120_CR55","doi-asserted-by":"publisher","first-page":"2607","DOI":"10.1103\/PhysRevLett.57.2607","volume":"57","author":"RH Swendsen","year":"1986","unstructured":"Swendsen, R.H., Wang, J.-S.: Replica Monte Carlo simulation of spin-glasses. Phys. Rev. Lett. 57, 2607\u20132609 (1986)","journal-title":"Phys. Rev. Lett."},{"key":"10120_CR56","unstructured":"TensorFlow. TensorFlow Addons Optimizers: CyclicalLearningRate (2021). https:\/\/www.tensorflow.org\/addons\/tutorials\/optimizers_cyclicallearningrate"},{"key":"10120_CR57","first-page":"1","volume":"17","author":"SJ Vollmer","year":"2016","unstructured":"Vollmer, S.J., Zygalakis, K.C., Teh, Y.W.: Exploration of the (non-)asymptotic bias and variance of stochastic gradient Langevin dynamics. J. Mach. Learn. Res. 17, 1\u201348 (2016)","journal-title":"J. Mach. Learn. Res."},{"key":"10120_CR58","doi-asserted-by":"publisher","first-page":"2050","DOI":"10.1103\/PhysRevLett.86.2050","volume":"86","author":"F Wang","year":"2001","unstructured":"Wang, F., Landau, D.P.: Efficient, multiple-range random walk algorithm to calculate the density of states. Phys. Rev. Lett. 86, 2050\u20132053 (2001)","journal-title":"Phys. Rev. Lett."},{"key":"10120_CR59","unstructured":"Weinhart, T., Singh, A., Thornton, A.: Perturbation theory & stability analysis. Slides (2010)"},{"key":"10120_CR60","unstructured":"Welling, M., Teh, Y.W.: Bayesian learning via stochastic gradient langevin dynamics. In: International Conference on Machine Learning (ICML) (2011)"},{"key":"10120_CR61","unstructured":"Wenzel, F., Roth, K., Veeling, B.S., \u015awiatkowski, J., Tran, L., Mandt, S., Snoek, J., Salimans, T., Jenatton, R., Nowozin, S.: How good is the Bayes posterior in deep neural networks really? In: International Conference on Machine Learning (ICML) (2020)"},{"key":"10120_CR62","unstructured":"Xu, P., Chen, J., Zou, D., Gu, Q.: Global convergence of langevin dynamics based algorithms for nonconvex optimization. In: Advances in Neural Information Processing Systems (NIPS) (2018)"},{"key":"10120_CR63","unstructured":"Ye, N., Zhu, Z., Mantiuk, R.K.: Langevin dynamics with continuous tempering for training deep neural networks. In: Proceedings of the 31st International Conference on Neural Information Processing Systems, NIPS\u201917, pp. 618\u2013626. Curran Associates Inc., Red Hook (2017)"},{"key":"10120_CR64","doi-asserted-by":"crossref","unstructured":"Zagoruyko, S., Komodakis, N.: Wide residual networks. In: Proceedings of the British Machine Vision Conference (BMVC), pp. 87.1\u201387.12 (2016)","DOI":"10.5244\/C.30.87"},{"key":"10120_CR65","unstructured":"Zhang, R., Li, C., Zhang, J., Chen, C., Wilson, A.G.: Cyclical stochastic gradient MCMC for Bayesian deep learning. In: International Conference on Learning Representation (ICLR) (2020)"},{"key":"10120_CR66","doi-asserted-by":"crossref","unstructured":"Zhang, X., Jiang, Y., Peng, H., Tu, K., Goldwasser, D.: Semi-supervised structured prediction with neural CRF autoencoder. In: Conference on Empirical Methods for Natural Language Processing (EMNLP), pp. 1701\u20131711 (2017)","DOI":"10.18653\/v1\/D17-1179"},{"key":"10120_CR67","doi-asserted-by":"crossref","unstructured":"Zhong, Z., Zheng, L., Kang, G., Li, S., Yang, Y.: Random erasing data augmentation. In: AAAI Conference on Artificial Intelligence, vol. 34 (2020)","DOI":"10.1609\/aaai.v34i07.7000"}],"container-title":["Statistics and Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11222-022-10120-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11222-022-10120-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11222-022-10120-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,25]],"date-time":"2022-08-25T19:20:49Z","timestamp":1661455249000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11222-022-10120-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,7,9]]},"references-count":67,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2022,8]]}},"alternative-id":["10120"],"URL":"https:\/\/doi.org\/10.1007\/s11222-022-10120-3","relation":{},"ISSN":["0960-3174","1573-1375"],"issn-type":[{"value":"0960-3174","type":"print"},{"value":"1573-1375","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,7,9]]},"assertion":[{"value":"1 September 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 June 2022","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 July 2022","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"58"}}