{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,17]],"date-time":"2026-02-17T15:41:15Z","timestamp":1771342875178,"version":"3.50.1"},"publisher-location":"Berlin, Heidelberg","reference-count":28,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"value":"9783540643418","type":"print"},{"value":"9783540697527","type":"electronic"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[1998]]},"DOI":"10.1007\/bfb0053994","type":"book-chapter","created":{"date-parts":[[2006,6,7]],"date-time":"2006-06-07T01:55:04Z","timestamp":1149645304000},"page":"27-62","source":"Crossref","is-referenced-by-count":15,"title":["Gradient based learning methods"],"prefix":"10.1007","author":[{"given":"Ah Chung","family":"Tsoi","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ah Chung","family":"Tsoi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2006,5,25]]},"reference":[{"key":"2_CR1","doi-asserted-by":"publisher","first-page":"975","DOI":"10.1016\/S0893-6080(09)80007-5","volume":"6","author":"F. Albertini","year":"1993","unstructured":"Albertini, F., Sontag, E. \u201cFor neural networks, function determines form\u201d. Neural Networks. Vol 6, pp 975\u2013990, 1993.","journal-title":"Neural Networks"},{"key":"2_CR2","volume-title":"Optimal Filtering","author":"B. Anderson","year":"1979","unstructured":"Anderson, B., Moore, J. Optimal Filtering. Prentice Hall, Englewood Cliffs, N.J., 1979."},{"issue":"No.3","key":"2_CR3","doi-asserted-by":"crossref","first-page":"375","DOI":"10.1162\/neco.1991.3.3.375","volume":"3","author":"A.D. Back","year":"1991","unstructured":"Back, A.D., Tsoi, A.C. \u201cFIR and IIR synapses, a new neural network architecture for time series modelling\u201d. Neural Computation. Vol. 3, No. 3, pp 375\u2013385, 1991.","journal-title":"Neural Computation"},{"key":"2_CR4","doi-asserted-by":"crossref","unstructured":"Back, A.D., Tsoi, A.C. \u201cA low sensitivity recurrent neural network\u201d. Neural Computation. To appear.","DOI":"10.1162\/089976698300017935"},{"issue":"No1","key":"2_CR5","doi-asserted-by":"publisher","first-page":"182","DOI":"10.1109\/72.363438","volume":"6","author":"P. Baldi","year":"1995","unstructured":"Baldi, P. \u201cGradient descent learning algorithm overview: A general dynamical systems perspective\u201d. IEEE Trans on Neural Networks. Vol. 6, No 1, Jan. pp 182\u2013195, 1995.","journal-title":"IEEE Trans on Neural Networks"},{"key":"2_CR6","unstructured":"Bryson, A., Ho, Y.C. Applied Optimal Control. Blaisdall Publishing Co., 1969."},{"key":"2_CR7","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1016\/0364-0213(90)90002-E","volume":"14","author":"J. Elman","year":"1990","unstructured":"Elman, J. \u201cFinding structure in time\u201d. Cognitive Science. Vol. 14, pp 179\u2013211, 1990.","journal-title":"Cognitive Science"},{"key":"2_CR8","doi-asserted-by":"crossref","first-page":"120","DOI":"10.1162\/neco.1992.4.1.120","volume":"4","author":"P. Frasconi","year":"1992","unstructured":"Frasconi, P., Gori, M., Soda, G. \u201cLocal feedback multilayered networks\u201d. Neural Computation. Vol. 4, pp 120\u2013130, 1992.","journal-title":"Neural Computation"},{"key":"2_CR9","volume-title":"Practical Optimization","author":"P. Gill","year":"1981","unstructured":"Gill, P., Murray, W., Wright, M. Practical Optimization. Academic Press. New York, 1981."},{"key":"2_CR10","volume-title":"Adaptive filtering, prediction and control","author":"G. Goodwin","year":"1984","unstructured":"Goodwin, G., Sin, K. S. Adaptive filtering, prediction and control. Prentice Hall, Englewood Cliffs, N.J. 1984."},{"key":"2_CR11","doi-asserted-by":"crossref","unstructured":"Hassibi, B., Stork, D., Wolff, G.J., \u201cOptimal Brain Surgeon and general network pruning\u201d. IEEE International Conference on Neural Networks. San Francisco (Ed. E. H. Ruspini et al), pp 293\u2013299, 1993.","DOI":"10.1109\/ICNN.1993.298572"},{"key":"2_CR12","unstructured":"Haykin, S. Neural Networks, A comprehensive foundation. MacMillan College Pub Co. 1994."},{"key":"2_CR13","doi-asserted-by":"publisher","first-page":"251","DOI":"10.1016\/0893-6080(91)90009-T","volume":"4","author":"K. Hornik","year":"1990","unstructured":"Hornik, K. \u201cApproximation capabilities of multilayer feedforward neural networks\u201d. Neural Networks. Vol. 4, pp 251\u2013257, 1990.","journal-title":"Neural Networks"},{"key":"2_CR14","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S. Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J. \u201cLong sort-term memory\u201d. Neural Computation. Vol 9, pp 1735\u20131780, 1997.","journal-title":"Neural Computation"},{"key":"2_CR15","volume-title":"Linear Systems","author":"T. Kailath","year":"1980","unstructured":"Kailath, T. Linear Systems. Prentice Hall, Englewood Cliffs, N.J., 1980."},{"key":"2_CR16","unstructured":"Lawrence, S., Giles, L., Back, A., Tsoi, A. C. \u201cThe gamma MLP \u2014 multiple temporal resolutions, the curse of dimensionality, and gradient descent learning\u201d. Neural Computation To appear."},{"key":"2_CR17","unstructured":"Le Cun, Y., Denker, J., Solla, S. \u201cOptimal brain damage\u201d. Advances in Neural Information Processing Systems, 2. Morgan Kaufman, pp 598\u2013605, 1990."},{"key":"2_CR18","doi-asserted-by":"publisher","first-page":"2152","DOI":"10.1049\/el:19961443","volume":"32","author":"C.S. Leung","year":"1996","unstructured":"Leung, C.S., Wong, K. W., Sum, J., Chan, L.W. \u201cOnline training and pruning for RLS algorithms\u201d. Electronics Letters. Vol. 32, pp 2152\u20132153, 1996.","journal-title":"Electronics Letters"},{"key":"2_CR19","unstructured":"M\u00fcller, M. Efficient Training of Feedforward Neural Networks. PhD thesis, Aarhus University, Dec, 1993."},{"key":"2_CR20","doi-asserted-by":"crossref","first-page":"165","DOI":"10.1162\/neco.1993.5.2.165","volume":"5","author":"O. Nerrand","year":"1993","unstructured":"Nerrand, O., Roussel-Ragot, P., Personnaz, L., Dreyfus, G., Marcos, S. \u201cNeural Networks and nonlinear adaptive filtering: Unifying concepts and new algorithms\u201d. Neural Computation. Vol 5, pp 165\u2013197, 1993.","journal-title":"Neural Computation"},{"key":"2_CR21","doi-asserted-by":"publisher","first-page":"649","DOI":"10.1109\/78.193206","volume":"41","author":"J. Principe","year":"1993","unstructured":"Principe, J., de Vries, B., Oliveira, P. \u201cThe gamma filter \u2014 a new class of adaptive IIR filters with restricted feedback\u201d. IEEE Trans Signal Processing. Vol. 41, pp 649\u2013656, 1993.","journal-title":"IEEE Trans Signal Processing"},{"key":"2_CR22","doi-asserted-by":"publisher","first-page":"279","DOI":"10.1109\/72.279191","volume":"5","author":"G. V. Puskorius","year":"1994","unstructured":"Puskorius, G. V., Feldkamp, L. A. \u201cNeurocontrol of nonlinear dynamical systems with Kaiman filter trained recurrent networks\u201d. IEEE Trans Neural Networks. Vol. 5, pp 279\u2013297, 1994.","journal-title":"IEEE Trans Neural Networks"},{"key":"2_CR23","volume-title":"PhD thesis","author":"A.J. Robinson","year":"1989","unstructured":"Robinson, A.J. Dynamic error propagation networks. PhD thesis, University of Cambridge, Cambridge, U.K., 1989."},{"key":"2_CR24","unstructured":"Scarselli, F. Tsoi, A.C. \u201cUniversal approximation using feedforward neural networks: A survey of some existing methods, and some results\u201d. Neural Networks. To appear."},{"issue":"No.2","key":"2_CR25","doi-asserted-by":"publisher","first-page":"229","DOI":"10.1109\/72.279187","volume":"5","author":"A.C. Tsoi","year":"1994","unstructured":"Tsoi, A.C., Back, A.D. \u201cLocally recurrent globally feedforward networks: a critical review of architectures\u201d. IEEE Trans on Neural Networks. Vol. 5, No. 2, pp 229\u2013239, 1994.","journal-title":"IEEE Trans on Neural Networks"},{"key":"2_CR26","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1016\/S0925-2312(97)00161-6","volume":"15","author":"A.D. Tsoi","year":"1997","unstructured":"Tsoi, A.D., Back, A.D. \u201cDiscrete time recurrent neural network architectures: a unifying review\u201d. Neurocomputing. Vol. 15, pp 183\u2013224, 1997.","journal-title":"Neurocomputing"},{"key":"2_CR27","unstructured":"Wan, E., Beaufays, F. \u201cDiagrammatic methods for deriving and relating temporal neural network algorithms\u201d. This volume."},{"key":"2_CR28","doi-asserted-by":"crossref","first-page":"270","DOI":"10.1162\/neco.1989.1.2.270","volume":"1","author":"R. Williams","year":"1989","unstructured":"Williams, R., Zipser, D. \u201cA learning algorithm for continually running fully recurrent neural networks\u201d. Neural Computation. Vol. 1, pp 270\u2013280, 1989.","journal-title":"Neural Computation"}],"container-title":["Lecture Notes in Computer Science","Adaptive Processing of Sequences and Data Structures"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/BFb0053994","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,2,10]],"date-time":"2019-02-10T18:04:00Z","timestamp":1549821840000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/BFb0053994"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1998]]},"ISBN":["9783540643418","9783540697527"],"references-count":28,"URL":"https:\/\/doi.org\/10.1007\/bfb0053994","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[1998]]}}}