{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,9]],"date-time":"2026-03-09T22:07:09Z","timestamp":1773094029868,"version":"3.50.1"},"publisher-location":"Berlin, Heidelberg","reference-count":23,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"value":"9783540653110","type":"print"},{"value":"9783540494300","type":"electronic"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[1998]]},"DOI":"10.1007\/3-540-49430-8_11","type":"book-chapter","created":{"date-parts":[[2007,8,11]],"date-time":"2007-08-11T14:57:33Z","timestamp":1186844253000},"page":"207-226","source":"Crossref","is-referenced-by-count":21,"title":["Centering Neural Network Gradient Factors"],"prefix":"10.1007","author":[{"given":"Nicol N.","family":"Schraudolph","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2002,3,28]]},"reference":[{"key":"11_CR1","volume-title":"Neurocomputing: Foundations of Research","year":"1988","unstructured":"J. Anderson and E. Rosenfeld, editors. Neurocomputing: Foundations of Research. MIT Press, Cambridge, 1988."},{"key":"11_CR2","first-page":"331","volume":"3","author":"R. Battiti","year":"1989","unstructured":"R. Battiti. Accelerated back-propagation learning: Two optimization methods. Complex Systems, 3:331\u2013342, 1989.","journal-title":"Complex Systems"},{"issue":"2","key":"11_CR3","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1162\/neco.1992.4.2.141","volume":"4","author":"R. Battiti","year":"1992","unstructured":"R. Battiti. First-and second-order methods for learning: Between steepest descent and Newton\u2019s method. Neural Computation, 4(2):141\u2013166, 1992.","journal-title":"Neural Computation"},{"key":"11_CR4","doi-asserted-by":"crossref","unstructured":"E. Bienenstock, L. Cooper, and P. Munro. Theory for the development of neuron selectivity: Orientation specificity and binocular interaction in visual cortex. Journal of Neuroscience, 2, 1982. Reprinted in [1].","DOI":"10.1523\/JNEUROSCI.02-01-00032.1982"},{"key":"11_CR5","unstructured":"D. H. Deterding. Speaker Normalisation for Automatic Speech Recognition. PhD thesis, University of Cambridge, 1989."},{"key":"11_CR6","volume-title":"Proceedings of the 1993 Connectionist Models Summer School","author":"M. Finke","year":"1994","unstructured":"M. Finke and K.-R. M\u00fcller. Estimating a-posteriori probabilities using stochastic network models. In M. C. Mozer, P. Smolensky, D. S. Touretzky, J. L. Elman, and A. S. Weigend, editors, Proceedings of the 1993 Connectionist Models Summer School, Boulder, CO, 1994. Lawrence Erlbaum Associates, Hillsdale, NJ."},{"issue":"6","key":"11_CR7","doi-asserted-by":"publisher","first-page":"607","DOI":"10.1109\/34.506411","volume":"18","author":"T. J. Hastie","year":"1996","unstructured":"T. J. Hastie and R. J. Tibshirani. Discriminant adaptive nearest neighbor classification. IEEE Transactions on Pattern Analysis and Machine Intelligence, 18(6):607\u2013616, 1996.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"11_CR8","unstructured":"M. Herrmann. On the merits of topography in neural maps. In T. Kohonen, editor, Proceedings of the Workshop on Self-Organizing Maps, pages 112\u2013117. Helsinki University of Technology, 1997."},{"key":"11_CR9","doi-asserted-by":"crossref","unstructured":"S. Hochreiter and J. Schmidhuber. Feature extraction through lococode. To appear in Neural Computation, 1998.","DOI":"10.1162\/089976699300016629"},{"issue":"1","key":"11_CR10","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1162\/neco.1992.4.1.98","volume":"4","author":"N. Intrator","year":"1992","unstructured":"N. Intrator. Feature extraction using an unsupervised neural network. Neural Computation, 4(1):98\u2013107, 1992.","journal-title":"Neural Computation"},{"key":"11_CR11","first-page":"247","volume":"D 22","author":"A. Lapedes","year":"1986","unstructured":"A. Lapedes and R. Farber. A self-optimizing, nonsymmetrical neural net for content addressable memory and pattern recognition. Physica, D 22:247\u2013259, 1986.","journal-title":"Physica"},{"issue":"18","key":"11_CR12","doi-asserted-by":"publisher","first-page":"2396","DOI":"10.1103\/PhysRevLett.66.2396","volume":"66","author":"Y. LeCun","year":"1991","unstructured":"Y. LeCun, I. Kanter, and S. A. Solla. Eigenvalues of covariance matrices: Application to neural-network learning. Physical Review Letters, 66(18):2396\u20132399, 1991.","journal-title":"Physical Review Letters"},{"key":"11_CR13","unstructured":"A. J. Robinson. Dynamic Error Propagation Networks. PhD thesis, University of Cambridge, 1989."},{"key":"11_CR14","first-page":"499","volume-title":"Advances in Neural Information Processing Systems","author":"N. N. Schraudolph","year":"1993","unstructured":"N. N. Schraudolph and T. J. Sejnowski. Unsupervised discrimination of clustered data via optimization of binary information gain. In S. J. Hanson, J. D. Cowan, and C. L. Giles, editors, Advances in Neural Information Processing Systems, volume 5, pages 499\u2013506. Morgan Kaufmann, San Mateo, CA, 1993."},{"key":"11_CR15","first-page":"563","volume-title":"Advances in Neural Information Processing Systems","author":"N. N. Schraudolph","year":"1996","unstructured":"N. N. Schraudolph and T. J. Sejnowski. Tempering backpropagation networks: Not all weights are created equal. In D. S. Touretzky, M. C. Mozer, and M. E. Hasselmo, editors, Advances in Neural Information Processing Systems, volume 8, pages 563\u2013569. The MIT Press, Cambridge, MA, 1996."},{"key":"11_CR16","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/BF00275079","volume":"4","author":"T. J. Sejnowski","year":"1977","unstructured":"T. J. Sejnowski. Storing covariance with nonlinearly interacting neurons. Journal of Mathematical Biology, 4:303\u2013321, 1977.","journal-title":"Journal of Mathematical Biology"},{"key":"11_CR17","doi-asserted-by":"publisher","first-page":"779","DOI":"10.1016\/S0893-6080(05)80139-X","volume":"5","author":"S. Shah","year":"1992","unstructured":"S. Shah, F. Palmieri, and M. Datum. Optimal filtering algorithms for fast learning in feedforward neural networks. Neural Networks, 5:779\u2013787, 1992.","journal-title":"Neural Networks"},{"key":"11_CR18","first-page":"662","volume-title":"Advances in Neural Information Processing Systems","author":"J. B. Tenenbaum","year":"1997","unstructured":"J. B. Tenenbaum and W. T. Freeman. Separating style and content. In M. C. Mozer, M. I. Jordan, and T. Petsche, editors, Advances in Neural Information Processing Systems, volume 9, pages 662\u2013668. The MIT Press, Cambridg, MA, 1997."},{"key":"11_CR19","doi-asserted-by":"crossref","unstructured":"P. D. Turney. Exploiting context when learning to classify. In Proceedings of the European Conference on Machine Learning, pages 402\u2013407, 1993.","DOI":"10.1007\/3-540-56602-3_158"},{"key":"11_CR20","unstructured":"P. D. Turney. Robust classification with context-sensitive features. In Proceedings of the Sixth International Conference on Industrial and Engineering Applications of Artificial Intelligence and Expert Systems, pages 268\u2013276, 1993."},{"key":"11_CR21","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1007\/BF00332914","volume":"59","author":"T. P. Vogl","year":"1988","unstructured":"T. P. Vogl, J. K. Mangis, A. K. Rigler, W. T. Zink, and D. L. Alkon. Accelerating the convergence of the back-propagation method. Biological Cybernetics, 59:257\u2013263, 1988.","journal-title":"Biological Cybernetics"},{"issue":"8","key":"11_CR22","doi-asserted-by":"publisher","first-page":"1151","DOI":"10.1109\/PROC.1976.10286","volume":"64","author":"B. Widrow","year":"1976","unstructured":"B. Widrow, J. M. McCool, M. G. Larimore, and C. R. Johnson, Jr. Stationary and nonstationary learning characteristics of the LMS adaptive filter. Proceedings of the IEEE, 64(8):1151\u20131162, 1976.","journal-title":"Proceedings of the IEEE"},{"key":"11_CR23","first-page":"1","volume-title":"Neuronale Netze in der \u00f6konomie: Grundlagen und finanzwirtschaftliche Anwendungen","author":"H. G. Zimmermann","year":"1994","unstructured":"H. G. Zimmermann. Neuronale Netze als Entscheidungskalk\u00fcl. In H. Rehkugler and H. G. Zimmermann, editors, Neuronale Netze in der \u00f6konomie: Grundlagen und finanzwirtschaftliche Anwendungen, pages 1\u201387. Vahlen Verlag, Munich, 1994."}],"container-title":["Lecture Notes in Computer Science","Neural Networks: Tricks of the Trade"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/3-540-49430-8_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,1]],"date-time":"2019-05-01T23:29:53Z","timestamp":1556753393000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/3-540-49430-8_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1998]]},"ISBN":["9783540653110","9783540494300"],"references-count":23,"URL":"https:\/\/doi.org\/10.1007\/3-540-49430-8_11","relation":{},"ISSN":["0302-9743"],"issn-type":[{"value":"0302-9743","type":"print"}],"subject":[],"published":{"date-parts":[[1998]]}}}