{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,12]],"date-time":"2026-06-12T05:45:43Z","timestamp":1781243143426,"version":"3.54.1"},"reference-count":24,"publisher":"Elsevier BV","issue":"4-5","license":[{"start":{"date-parts":[[1993,6,1]],"date-time":"1993-06-01T00:00:00Z","timestamp":738892800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Neurocomputing"],"published-print":{"date-parts":[[1993,6]]},"DOI":"10.1016\/0925-2312(93)90006-o","type":"journal-article","created":{"date-parts":[[2003,9,3]],"date-time":"2003-09-03T13:52:02Z","timestamp":1062597122000},"page":"185-196","source":"Crossref","is-referenced-by-count":816,"title":["Backpropagation and stochastic gradient descent method"],"prefix":"10.1016","volume":"5","author":[{"given":"Shun-ichi","family":"Amari","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"78","reference":[{"key":"10.1016\/0925-2312(93)90006-O_BIB1","first-page":"1307","article-title":"A probabilistic problem on training automata to recognize classes and the method of potential functions","volume":"25","author":"Aizerman","year":"1964","journal-title":"Automation and Remote Control"},{"key":"10.1016\/0925-2312(93)90006-O_BIB2","doi-asserted-by":"crossref","first-page":"299","DOI":"10.1109\/PGEC.1967.264666","article-title":"Theory of adaptive pattern classifiers","volume":"EC-16","author":"Amari","year":"1967","journal-title":"IEEE Trans. Elect. Comput."},{"key":"10.1016\/0925-2312(93)90006-O_BIB3","series-title":"Geometrical Theory of Information","author":"Amari","year":"1968"},{"key":"10.1016\/0925-2312(93)90006-O_BIB4","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4612-5056-2_2","article-title":"Differential-geometrical methods of statistics","volume":"28","author":"Amari","year":"1985","journal-title":"Springer Lecture Notes in Statistics"},{"key":"10.1016\/0925-2312(93)90006-O_BIB5","first-page":"1443","article-title":"Mathematical foundations of neurocomputing","volume":"78","author":"Amari","year":"1990"},{"key":"10.1016\/0925-2312(93)90006-O_BIB6","doi-asserted-by":"crossref","first-page":"443","DOI":"10.1016\/0893-6080(91)90040-C","article-title":"Dualistic geometry of the manifold of higher-order neurons","volume":"4","author":"Amari","year":"1991","journal-title":"Neural Networks"},{"key":"10.1016\/0925-2312(93)90006-O_BIB7","doi-asserted-by":"crossref","first-page":"605","DOI":"10.1162\/neco.1992.4.4.605","article-title":"Four types of learning curves","volume":"4","author":"Amari","year":"1992","journal-title":"Neural Computat."},{"key":"10.1016\/0925-2312(93)90006-O_BIB8","doi-asserted-by":"crossref","first-page":"260","DOI":"10.1109\/72.125867","article-title":"Information geometry of Boltzmann machines","volume":"3","author":"Amari","year":"1992","journal-title":"IEEE Trans. Neural Networks"},{"key":"10.1016\/0925-2312(93)90006-O_BIB9","doi-asserted-by":"crossref","first-page":"123","DOI":"10.1103\/RevModPhys.34.123","article-title":"The perception, a model for brain functioning I","volume":"34","author":"Block","year":"1962","journal-title":"Rev. Modern Physics"},{"key":"10.1016\/0925-2312(93)90006-O_BIB10","doi-asserted-by":"crossref","first-page":"135","DOI":"10.1103\/RevModPhys.34.135","article-title":"Analysis of a four-layer series coupled perceptron II","volume":"34","author":"Block","year":"1962","journal-title":"Rev. Modern Physics"},{"key":"10.1016\/0925-2312(93)90006-O_BIB11","doi-asserted-by":"crossref","first-page":"2718","DOI":"10.1103\/PhysRevA.44.2718","article-title":"Learning processes in neural networks","volume":"A440","author":"Heskes","year":"1991","journal-title":"Physical Rev."},{"key":"10.1016\/0925-2312(93)90006-O_BIB12","series-title":"Proc. Connectionists Summer School","article-title":"Equivalence proofs for multilayer perceptron classifiers and the Bayesian discriminant function","author":"Hampshire","year":"1990"},{"key":"10.1016\/0925-2312(93)90006-O_BIB13","doi-asserted-by":"crossref","first-page":"59","DOI":"10.1007\/BF00337288","article-title":"Self-organized formation of topologically correct feature maps","volume":"43","author":"Kohonen","year":"1982","journal-title":"Biol. Cybernet."},{"key":"10.1016\/0925-2312(93)90006-O_BIB14","first-page":"981","article-title":"Self organizing maps: Optimization approaches","volume":"vol. 2","author":"Kohonen","year":"1991"},{"key":"10.1016\/0925-2312(93)90006-O_BIB15","series-title":"Information Theory and Statistics","author":"Kullback","year":"1959"},{"key":"10.1016\/0925-2312(93)90006-O_BIB16","doi-asserted-by":"crossref","first-page":"978","DOI":"10.1126\/science.247.4945.978","article-title":"Regularization algorithms for learning that are equivalent to multilayer networks","volume":"247","author":"Poggio","year":"1990","journal-title":"Science"},{"key":"10.1016\/0925-2312(93)90006-O_BIB17","doi-asserted-by":"crossref","first-page":"461","DOI":"10.1162\/neco.1991.3.4.461","article-title":"Neural network classifiers estimate Bayesian a posteriori probabilities","volume":"3","author":"Richard","year":"1991","journal-title":"Neural Comput."},{"key":"10.1016\/0925-2312(93)90006-O_BIB18","article-title":"Learning logic","author":"Parker","year":"1982"},{"key":"10.1016\/0925-2312(93)90006-O_BIB19","article-title":"Principles of Neurodynamics","author":"Rosenblatt","year":"1961"},{"key":"10.1016\/0925-2312(93)90006-O_BIB20","first-page":"318","article-title":"Learning internal representations by error propagation","volume":"vol. 1","author":"Rumelhart","year":"1986"},{"key":"10.1016\/0925-2312(93)90006-O_BIB21","series-title":"Stochastic Approximation","author":"Wasan","year":"1969"},{"key":"10.1016\/0925-2312(93)90006-O_BIB22","article-title":"Beyond regression: New Tool for prediction and analysis in the behavioral sciences","author":"Werbos","year":"1974"},{"key":"10.1016\/0925-2312(93)90006-O_BIB23","series-title":"A Statistical theory of Adaptation","author":"Widrow","year":"1963"},{"key":"10.1016\/0925-2312(93)90006-O_BIB24","doi-asserted-by":"crossref","first-page":"425","DOI":"10.1162\/neco.1989.1.4.425","article-title":"Learning in artificial networks: A statistical perspective","volume":"1","author":"White","year":"1989","journal-title":"Neural Comput."}],"container-title":["Neurocomputing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:092523129390006O?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:092523129390006O?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2019,2,25]],"date-time":"2019-02-25T05:22:55Z","timestamp":1551072175000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/092523129390006O"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1993,6]]},"references-count":24,"journal-issue":{"issue":"4-5","published-print":{"date-parts":[[1993,6]]}},"alternative-id":["092523129390006O"],"URL":"https:\/\/doi.org\/10.1016\/0925-2312(93)90006-o","relation":{},"ISSN":["0925-2312"],"issn-type":[{"value":"0925-2312","type":"print"}],"subject":[],"published":{"date-parts":[[1993,6]]}}}