{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T23:28:48Z","timestamp":1769642928315,"version":"3.49.0"},"reference-count":23,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,11,1]],"date-time":"2020-11-01T00:00:00Z","timestamp":1604188800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,11,1]],"date-time":"2020-11-01T00:00:00Z","timestamp":1604188800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,11,1]]},"DOI":"10.1109\/ieeeconf51394.2020.9443275","type":"proceedings-article","created":{"date-parts":[[2021,6,3]],"date-time":"2021-06-03T21:32:35Z","timestamp":1622755955000},"page":"1214-1221","source":"Crossref","is-referenced-by-count":12,"title":["Separating the Effects of Batch Normalization on CNN Training Speed and Stability Using Classical Adaptive Filter Theory"],"prefix":"10.1109","author":[{"given":"Elaina","family":"Chai","sequence":"first","affiliation":[{"name":"Stanford University,Dept. of Electrical Engineering,Stanford,CA"}]},{"given":"Mert","family":"Pilanci","sequence":"additional","affiliation":[{"name":"Stanford University,Dept. of Electrical Engineering,Stanford,CA"}]},{"given":"Boris","family":"Murmann","sequence":"additional","affiliation":[{"name":"Stanford University,Dept. of Electrical Engineering,Stanford,CA"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.21236\/AD0241531"},{"key":"ref11","author":"haykin","year":"2002","journal-title":"Adaptive Filter Theory"},{"key":"ref12","first-page":"563","article-title":"Adaptive filters","author":"widrow","year":"1971","journal-title":"Aspects of Network and System Theory"},{"key":"ref13","article-title":"Learning multiple layers of features from tiny images","author":"krizhevsky","year":"2009"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/35.41400"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/5.726791"},{"key":"ref16","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","volume":"25","author":"krizhevsky","year":"2012","journal-title":"Advances in neural information processing systems"},{"key":"ref17","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2014"},{"key":"ref18","first-page":"249","article-title":"Understanding the difficulty of training deep feedforward neural networks","author":"glorot","year":"2010","journal-title":"Proceedings of the Thirteenth International Conference on Artificial Intelligence and Statistics"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.123"},{"key":"ref4","article-title":"A mean field theory of batch normalization","author":"greg","year":"2019","journal-title":"International Conference on Learning Representations"},{"key":"ref3","first-page":"582","article-title":"Which neural net architectures give rise to exploding and vanishing gradients?","volume":"32","author":"hanin","year":"2018","journal-title":"Advances in neural information processing systems"},{"key":"ref6","first-page":"2488","article-title":"How does batch normalization help optimization?","volume":"32","author":"santurkar","year":"2018","journal-title":"Advances in neural information processing systems"},{"key":"ref5","first-page":"8024","article-title":"Pytorch: An imperative style, high-performance deep learning library","volume":"33","author":"paszke","year":"2019","journal-title":"Advances in neural information processing systems"},{"key":"ref8","first-page":"536","article-title":"The shattered gradients problem: If resnets are the answer, then what is the question?","author":"balduzzi","year":"2017","journal-title":"Proceedings of the 34th International Conference on Machine Learning"},{"key":"ref7","article-title":"Fixup initialization: Residual learning without normalization","author":"zhang","year":"2019","journal-title":"International Conference on Learning Representations"},{"key":"ref2","first-page":"448","article-title":"Batch normalization: Accelerating deep network training by reducing internal covariate shift","author":"ioffe","year":"2015","journal-title":"Proceedings of The 32nd International Conference on Machine Learning"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref9","article-title":"An adaptive adaline neuron using chemical memistors","author":"widrow","year":"1960","journal-title":"Tech Rep TR-1553-2"},{"key":"ref20","first-page":"1","article-title":"All you need is a good init","author":"mishkin","year":"2016","journal-title":"4th International Conference on Learning Representations"},{"key":"ref22","first-page":"156","article-title":"Automatic learning rate maximization by on-line estimation of the hessian&#x2019;s eigenvectors","author":"lecun","year":"1993","journal-title":"Advances in Neural Information Processing Systems 7"},{"key":"ref21","first-page":"6520","article-title":"On the local hessian in backpropagation","volume":"32","author":"zhang","year":"2018","journal-title":"Advances in neural information processing systems"},{"key":"ref23","doi-asserted-by":"crossref","first-page":"9","DOI":"10.1007\/978-3-642-35289-8_3","article-title":"Efficient BackProp","author":"lecun","year":"2012","journal-title":"Neural Networks Tricks of the Trade"}],"event":{"name":"2020 54th Asilomar Conference on Signals, Systems, and Computers","location":"Pacific Grove, CA, USA","start":{"date-parts":[[2020,11,1]]},"end":{"date-parts":[[2020,11,4]]}},"container-title":["2020 54th Asilomar Conference on Signals, Systems, and Computers"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9443248\/9443268\/09443275.pdf?arnumber=9443275","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,2]],"date-time":"2022-08-02T19:58:32Z","timestamp":1659470312000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9443275\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,11,1]]},"references-count":23,"URL":"https:\/\/doi.org\/10.1109\/ieeeconf51394.2020.9443275","relation":{},"subject":[],"published":{"date-parts":[[2020,11,1]]}}}