{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,25]],"date-time":"2026-04-25T12:57:38Z","timestamp":1777121858658,"version":"3.51.4"},"reference-count":45,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2019,11,1]],"date-time":"2019-11-01T00:00:00Z","timestamp":1572566400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2019,11,1]],"date-time":"2019-11-01T00:00:00Z","timestamp":1572566400000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/100000181","name":"AFOSR","doi-asserted-by":"crossref","award":["FA9550-17-1-0125"],"award-info":[{"award-number":["FA9550-17-1-0125"]}],"id":[{"id":"10.13039\/100000181","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CAREER grant #1752116"],"award-info":[{"award-number":["CAREER grant #1752116"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Math Imaging Vis"],"published-print":{"date-parts":[[2020,4]]},"DOI":"10.1007\/s10851-019-00922-y","type":"journal-article","created":{"date-parts":[[2019,11,1]],"date-time":"2019-11-01T17:04:39Z","timestamp":1572627879000},"page":"328-351","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":42,"title":["Forward Stability of ResNet and Its Variants"],"prefix":"10.1007","volume":"62","author":[{"given":"Linan","family":"Zhang","sequence":"first","affiliation":[]},{"given":"Hayden","family":"Schaeffer","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,11,1]]},"reference":[{"issue":"1","key":"922_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1561\/2200000006","volume":"2","author":"Y Bengio","year":"2009","unstructured":"Bengio, Y.: Learning deep architectures for AI. Found. Trends. Mach. Learn. 2(1), 1\u2013127 (2009)","journal-title":"Found. Trends. Mach. Learn."},{"issue":"2","key":"922_CR2","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1109\/72.279181","volume":"5","author":"Y Bengio","year":"1994","unstructured":"Bengio, Y., Simard, P., Frasconi, P.: Learning long-term dependencies with gradient descent is difficult. IEEE Trans. Neural Netw. 5(2), 157\u2013166 (1994)","journal-title":"IEEE Trans. Neural Netw."},{"key":"922_CR3","doi-asserted-by":"crossref","unstructured":"Biggio, B., Corona, I., Maiorca, D., Nelson, B., \u0160rndi\u0107, N., Laskov, P., Giacinto, G., Roli, F.: Evasion attacks against machine learning at test time. In: Joint European Conference on Machine Learning and Knowledge Discovery in Databases, Springer, pp. 387\u2013402 (2013)","DOI":"10.1007\/978-3-642-40994-3_25"},{"issue":"2","key":"922_CR4","doi-asserted-by":"publisher","first-page":"223","DOI":"10.1137\/16M1080173","volume":"60","author":"L Bottou","year":"2018","unstructured":"Bottou, L., Curtis, F.E., Nocedal, J.: Optimization methods for large-scale machine learning. SIAM Rev. 60(2), 223\u2013311 (2018)","journal-title":"SIAM Rev."},{"key":"922_CR5","doi-asserted-by":"crossref","unstructured":"Chang, B., Meng, L., Haber, E., Ruthotto, L., Begert, D., Holtham, E.: Reversible architectures for arbitrarily deep residual neural networks. In: Thirty-Second AAAI Conference on Artificial Intelligence (2018)","DOI":"10.1609\/aaai.v32i1.11668"},{"key":"922_CR6","unstructured":"Chaudhari, P., Choromanska, A., Soatto, S., LeCun, Y., Baldassi, C., Borgs, C., Chayes, J., Sagun, L., Zecchina, R.: Entropy-SGD: biasing gradient descent into wide valleys. ArXiv e-prints (2016)"},{"issue":"3","key":"922_CR7","doi-asserted-by":"publisher","first-page":"30","DOI":"10.1007\/s40687-018-0148-y","volume":"5","author":"P Chaudhari","year":"2018","unstructured":"Chaudhari, P., Oberman, A., Osher, S., Soatto, S., Carlier, G.: Deep relaxation: partial differential equations for optimizing deep neural networks. Res. Math. Sci. 5(3), 30 (2018)","journal-title":"Res. Math. Sci."},{"key":"922_CR8","volume-title":"Some Gronwall Type Inequalities and Applications","author":"SS Dragomir","year":"2003","unstructured":"Dragomir, S.S.: Some Gronwall Type Inequalities and Applications. Nova Science Publishers, New York (2003)"},{"key":"922_CR9","unstructured":"Du, S.S., Zhai, X., Poczos, Barnabas, S., Aarti: gradient descent provably optimizes over-parameterized neural networks. ArXiv e-prints (2018)"},{"key":"922_CR10","doi-asserted-by":"publisher","first-page":"347","DOI":"10.1007\/s10107-005-0619-y","volume":"104","author":"JF Edmond","year":"2005","unstructured":"Edmond, J.F., Thibault, L.: Relaxation of an optimal control problem involving a perturbed sweeping process. Math. Program. Ser. B 104, 347\u2013373 (2005)","journal-title":"Math. Program. Ser. B"},{"key":"922_CR11","unstructured":"Goldstein, T., Studer, C., Baraniuk, R.: A field guide to forward-backward splitting with a FASTA implementation. ArXiv e-prints (2014)"},{"key":"922_CR12","unstructured":"Gomez, A.\u00a0N., Ren, M., Urtasun, R., Grosse, R.\u00a0B.: The reversible residual network: backpropagation without storing activations. In: Advances in Neural Information Processing Systems, pp. 2214\u20132224 (2017)"},{"key":"922_CR13","unstructured":"Goodfellow, I.J., Pouget-Abadie, J., Mirza, M., Xu, B., Warde-Farley, D., Ozair, S., Courville, A., Bengio, Y.: Generative adversarial nets. In: Advances in Neural Information Processing Systems, pp. 2672\u20132680 (2014)"},{"issue":"1","key":"922_CR14","doi-asserted-by":"publisher","first-page":"014004","DOI":"10.1088\/1361-6420\/aa9a90","volume":"34","author":"E Haber","year":"2017","unstructured":"Haber, E., Ruthotto, L.: Stable architectures for deep neural networks. Inverse Probl. 34(1), 014004 (2017)","journal-title":"Inverse Probl."},{"key":"922_CR15","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Delving deep into rectifiers: surpassing human-level performance on imagenet classification. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1026\u20131034 (2015)","DOI":"10.1109\/ICCV.2015.123"},{"key":"922_CR16","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"922_CR17","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Identity mappings in deep residual networks. In: European Conference on Computer Vision, Springer, pp. 630\u2013645 (2016)","DOI":"10.1007\/978-3-319-46493-0_38"},{"key":"922_CR18","doi-asserted-by":"crossref","unstructured":"Huang, G., Liu, Z., Van Der\u00a0Maaten, L., Weinberger, K.\u00a0Q.: Densely connected convolutional networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4700\u20134708 (2017)","DOI":"10.1109\/CVPR.2017.243"},{"key":"922_CR19","unstructured":"Ioffe, S., Szegedy, C.: Batch normalization: accelerating deep network training by reducing internal covariate shift. ArXiv e-prints (2015)"},{"key":"922_CR20","doi-asserted-by":"publisher","first-page":"213","DOI":"10.1016\/j.nahs.2018.05.007","volume":"30","author":"M Kamenskii","year":"2018","unstructured":"Kamenskii, M., Makarenkov, O., Wadippuli, L.N., de\u00a0Fitte, P.R.: Global stability of almost periodic solutions to monotone sweeping processes and their response to non-monotone perturbations. Nonlinear Anal. Hybrid Syst. 30, 213\u2013224 (2018)","journal-title":"Nonlinear Anal. Hybrid Syst."},{"key":"922_CR21","unstructured":"Keskar, N.\u00a0S., Mudigere, D., Nocedal, J., Smelyanskiy, M., Tang, P.T.P.: On large-batch training for deep learning: generalization gap and sharp minima. In: International Conference on Learning Representations (2017)"},{"key":"922_CR22","unstructured":"Krizhevsky, A., Sutskever, I., Hinton, G.E.: ImageNet classification with deep convolutional neural networks. In: Advances in Neural Information Processing Systems, pp. 1097\u20131105 (2012)"},{"key":"922_CR23","unstructured":"Larsson, G., Maire, M., Shakhnarovich, G.: FractalNet: Ultra-deep neural networks without residuals. ArXiv e-prints (2016)"},{"issue":"7553","key":"922_CR24","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun, Y., Bengio, Y., Hinton, G.: Deep learning. Nature 521(7553), 436 (2015)","journal-title":"Nature"},{"issue":"4","key":"922_CR25","doi-asserted-by":"publisher","first-page":"541","DOI":"10.1162\/neco.1989.1.4.541","volume":"1","author":"Y LeCun","year":"1989","unstructured":"LeCun, Y., Boser, B., Denker, J.S., Henderson, D., Howard, R.E., Hubbard, W., Jackel, L.D.: Backpropagation applied to handwritten zip code recognition. Neural Comput. 1(4), 541\u2013551 (1989)","journal-title":"Neural Comput."},{"key":"922_CR26","unstructured":"Li, H., Xu, Z., Taylor, G., Studer, C., Goldstein, T.: Visualizing the loss landscape of neural nets. In: Advances in Neural Information Processing Systems, pp. 6389\u20136399 (2018)"},{"key":"922_CR27","unstructured":"Li, Z., Shi, Z.: Deep residual learning and PDEs on manifold. arXiv preprint arXiv:1708.05115 (2017)"},{"issue":"6","key":"922_CR28","doi-asserted-by":"publisher","first-page":"964","DOI":"10.1137\/0716071","volume":"16","author":"P-L Lions","year":"1979","unstructured":"Lions, P.-L., Mercier, B.: Splitting algorithms for the sum of two nonlinear operators. SIAM J. Numer. Anal. 16(6), 964\u2013979 (1979)","journal-title":"SIAM J. Numer. Anal."},{"key":"922_CR29","doi-asserted-by":"publisher","first-page":"1235","DOI":"10.1090\/S0002-9947-96-01543-7","volume":"348","author":"BS Mordukhovich","year":"1996","unstructured":"Mordukhovich, B.S., Shao, Y.: Nonsmooth sequential analysis in asplund spaces. Trans. Am. Math. Soc. 348, 1235\u20131280 (1996)","journal-title":"Trans. Am. Math. Soc."},{"key":"922_CR30","unstructured":"Oberman, A.\u00a0M., Calder, J.: Lipschitz regularized deep neural networks converge and generalize. ArXiv e-prints (2018)"},{"issue":"5","key":"922_CR31","doi-asserted-by":"publisher","first-page":"1805","DOI":"10.1090\/S0002-9947-96-01544-9","volume":"348","author":"RA Poliquin","year":"1996","unstructured":"Poliquin, R.A., Rockafellar, R.T.: Prox-regular functions in variational analysis. Trans. Am. Math. Soc. 348(5), 1805\u20131838 (1996)","journal-title":"Trans. Am. Math. Soc."},{"issue":"3","key":"922_CR32","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky, O., Deng, J., Hao, S., Krause, J., Satheesh, S., Ma, S., Huang, Z., Karpathy, A., Khosla, A., Bernstein, M., Berg, A.C., Fei-Fei, L.: ImageNet large scale visual recognition challenge. Int. J. Comput. Vis. (IJCV) 115(3), 211\u2013252 (2015)","journal-title":"Int. J. Comput. Vis. (IJCV)"},{"key":"922_CR33","doi-asserted-by":"crossref","unstructured":"Ruthotto, L., Haber, E.: Deep neural networks motivated by partial differential equations. ArXiv e-prints (2018)","DOI":"10.1007\/s10851-019-00903-1"},{"issue":"7","key":"922_CR34","doi-asserted-by":"publisher","first-page":"1757","DOI":"10.4310\/CMS.2018.v16.n7.a1","volume":"16","author":"H Schaeffer","year":"2018","unstructured":"Schaeffer, H.: A penalty method for some nonlinear variational obstacle problems. Commun. Math. Sci. 16(7), 1757\u20131777 (2018)","journal-title":"Commun. Math. Sci."},{"key":"922_CR35","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. ArXiv e-prints (2014)"},{"key":"922_CR36","unstructured":"Singer, Y., Duchi, J.C.: Efficient learning using forward\u2013backward splitting. In: Advances in Neural Information Processing Systems, vol. 22, Curran Associates, Inc., pp. 495\u2013503 (2009)"},{"key":"922_CR37","unstructured":"Sussillo, D., Abbott, L.F.: Random walk initialization for training very deep feedforward networks. ArXiv e-prints (2014)"},{"key":"922_CR38","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Liu, W., Jia, Y., Sermanet, P., Reed, S., Anguelov, D., Erhan, D., Vanhoucke, V., Rabinovich, A.: Going deeper with convolutions. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1\u20139 (2015)","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"922_CR39","unstructured":"Szegedy, C., Zaremba, W., Sutskever, I., Bruna, J., Erhan, D., Goodfellow, I., Fergus, R.: Intriguing properties of neural networks. ArXiv e-prints (2013)"},{"key":"922_CR40","unstructured":"Thorpe, M., van Gennip, Y.: Deep limits of residual neural networks. ArXiv e-prints (2018)"},{"issue":"4","key":"922_CR41","doi-asserted-by":"publisher","first-page":"1424","DOI":"10.1137\/140963303","volume":"75","author":"G Tran","year":"2015","unstructured":"Tran, G., Schaeffer, H., Feldman, W.M., Osher, S.J.: An $l^1$ penalty method for general obstacle problems. SIAM J. Appl. Math. 75(4), 1424\u20131444 (2015)","journal-title":"SIAM J. Appl. Math."},{"key":"922_CR42","unstructured":"Vidal, R., Bruna, J., Giryes, R., Soatto, S.: Mathematics of deep learning. ArXiv e-prints (2017)"},{"key":"922_CR43","unstructured":"Wang, B., Luo, X., Li, Z., Zhu, W., Shi, Z., Osher, S.: Deep neural nets with interpolating function as output activation. In: Advances in Neural Information Processing Systems, pp. 743\u2013753 (2018)"},{"issue":"1","key":"922_CR44","doi-asserted-by":"publisher","first-page":"10","DOI":"10.1007\/s40687-018-0172-y","volume":"6","author":"E Weinan","year":"2019","unstructured":"Weinan, E., Han, J., Li, Q.: A mean-field optimal control formulation of deep learning. Res. Math. Sci. 6(1), 10 (2019)","journal-title":"Res. Math. Sci."},{"issue":"1","key":"922_CR45","first-page":"1","volume":"5","author":"E Weinan","year":"2017","unstructured":"Weinan, E.: A proposal on machine learning via dynamical systems. Commun. Math. Stat. 5(1), 1\u201311 (2017)","journal-title":"Commun. Math. Stat."}],"container-title":["Journal of Mathematical Imaging and Vision"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10851-019-00922-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10851-019-00922-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10851-019-00922-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,10,3]],"date-time":"2022-10-03T08:03:36Z","timestamp":1664784216000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10851-019-00922-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,11,1]]},"references-count":45,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2020,4]]}},"alternative-id":["922"],"URL":"https:\/\/doi.org\/10.1007\/s10851-019-00922-y","relation":{},"ISSN":["0924-9907","1573-7683"],"issn-type":[{"value":"0924-9907","type":"print"},{"value":"1573-7683","type":"electronic"}],"subject":[],"published":{"date-parts":[[2019,11,1]]},"assertion":[{"value":"24 November 2018","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 October 2019","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 November 2019","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}