{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,4]],"date-time":"2025-07-04T09:45:43Z","timestamp":1751622343324},"reference-count":56,"publisher":"Elsevier","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[1998]]},"DOI":"10.1016\/s1874-5946(98)80068-0","type":"book-chapter","created":{"date-parts":[[2008,4,17]],"date-time":"2008-04-17T08:37:47Z","timestamp":1208421467000},"page":"87-121","source":"Crossref","is-referenced-by-count":7,"title":["Weight initialization techniques"],"prefix":"10.1016","author":[{"given":"Mikko","family":"Lehtokangas","sequence":"first","affiliation":[]},{"given":"Jukka","family":"Saarinen","sequence":"additional","affiliation":[]},{"given":"Petri","family":"Salmela","sequence":"additional","affiliation":[]},{"given":"Kimmo","family":"Kaski","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/S1874-5946(98)80068-0_bib1","series-title":"Parallel Distributed Processing: Explorations in the Microstructure of Cognnition","first-page":"318","article-title":"Learning internal representations by error propagation","author":"Rumelhart","year":"1986"},{"key":"10.1016\/S1874-5946(98)80068-0_bib2","series-title":"Proceedings of Computational Learning Theory, COLT'88","first-page":"9","article-title":"Training a 3-node neural networks is NP-complete","author":"Blum","year":"1988"},{"key":"10.1016\/S1874-5946(98)80068-0_bib3","doi-asserted-by":"crossref","first-page":"177","DOI":"10.1016\/0885-064X(88)90019-2","article-title":"On the complexity of loading shallow neural networks","volume":"4","author":"Judd","year":"1988","journal-title":"J. Complexity"},{"key":"10.1016\/S1874-5946(98)80068-0_bib4","doi-asserted-by":"crossref","first-page":"382","DOI":"10.1162\/neco.1989.1.3.382","article-title":"Asymptotic convergence of backpropagation","volume":"1","author":"Tesauro","year":"1989","journal-title":"Neural Comput."},{"key":"10.1016\/S1874-5946(98)80068-0_bib5","doi-asserted-by":"crossref","first-page":"295","DOI":"10.1016\/0893-6080(88)90003-2","article-title":"Increased rates of convergence through learning rate adaptation","volume":"1","author":"Jacobs","year":"1988","journal-title":"Neural Networks"},{"key":"10.1016\/S1874-5946(98)80068-0_bib6","article-title":"An empirical study of learning speed in backpropagation networks","author":"Fahlman","year":"1988"},{"key":"10.1016\/S1874-5946(98)80068-0_bib7","first-page":"517","article-title":"Speeding-up backpropagation\u2014a comparison of orthogonal techniques.","volume":"Vol. 1","author":"Pfister","year":"1993"},{"key":"10.1016\/S1874-5946(98)80068-0_bib8","article-title":"Optimization of the backpropagation algorithm for training multilayer perceptrons","author":"Schiffmann","year":"1992"},{"key":"10.1016\/S1874-5946(98)80068-0_bib9","series-title":"Advances in Neural Information Processing System 1","first-page":"107","article-title":"Skeletonization: A technique for trimming tha fat from a network via reelevance assessment","author":"Mozer","year":"1989"},{"key":"10.1016\/S1874-5946(98)80068-0_bib10","first-page":"326","article-title":"Neural net pruming\u2014why and how","volume":"Vol. I","author":"Sietsma","year":"1988"},{"key":"10.1016\/S1874-5946(98)80068-0_bib11","first-page":"749","article-title":"Curvature-driven smoothing in backpropagation neural networks","volume":"Vol. II","author":"Bishop","year":"1990"},{"key":"10.1016\/S1874-5946(98)80068-0_bib12","first-page":"643","article-title":"Dynamic behavior of constrained backpropagation networks","volume":"2","author":"Chauvin","year":"1990"},{"key":"10.1016\/S1874-5946(98)80068-0_bib13","first-page":"177","article-title":"Comparing biases for minimal network construction with backpropagation","author":"Hanson","year":"1989"},{"key":"10.1016\/S1874-5946(98)80068-0_bib14","doi-asserted-by":"crossref","first-page":"67","DOI":"10.1016\/0893-6080(91)90033-2","article-title":"Creating artificial neural networks that generalize","volume":"4","author":"Sietsma","year":"1991","journal-title":"Neural Networks"},{"key":"10.1016\/S1874-5946(98)80068-0_bib15","doi-asserted-by":"crossref","first-page":"365","DOI":"10.1080\/09540098908915647","article-title":"Dynamic node creation in backpropagation networks","volume":"1","author":"Ash","year":"1989","journal-title":"Connection Sci."},{"key":"10.1016\/S1874-5946(98)80068-0_bib16","series-title":"Advances in Neural Information Processing Systems","first-page":"524","article-title":"The cascade-correlation learning architecture","author":"Fahlman","year":"1990"},{"key":"10.1016\/S1874-5946(98)80068-0_bib17","doi-asserted-by":"crossref","first-page":"61","DOI":"10.1016\/0893-6080(91)90032-Z","article-title":"Backpropagation algorithm which varies the number of hidden units","volume":"4","author":"Hirose","year":"1991","journal-title":"Neural Networks"},{"key":"10.1016\/S1874-5946(98)80068-0_bib18","first-page":"598","article-title":"Initializations, backpropagations and generalizations of feedforward classifiers","volume":"Vol. 1","author":"Schmidt","year":"1993"},{"key":"10.1016\/S1874-5946(98)80068-0_bib19","article-title":"The use, of feed-forward and recurrent neural networks for system identification","author":"Burrows","year":"1993"},{"key":"10.1016\/S1874-5946(98)80068-0_bib20","series-title":"Proceedings of the 1990 IEEE International Conference on Systems, Man and Cybernetics","first-page":"370","article-title":"Optimal initialization for multilayer perceptrons","author":"Chen","year":"1990"},{"key":"10.1016\/S1874-5946(98)80068-0_bib21","doi-asserted-by":"crossref","first-page":"351","DOI":"10.1016\/0893-6080(93)90003-F","article-title":"Initializing back propagation networs with prototypes","volume":"6","author":"Denoeux","year":"1993","journal-title":"Neural Networks"},{"key":"10.1016\/S1874-5946(98)80068-0_bib22","doi-asserted-by":"crossref","first-page":"627","DOI":"10.1109\/72.143378","article-title":"Statistically controlled activation weight initialization (SCAWI)","volume":"3","author":"Drago","year":"1992","journal-title":"IEEE Trans. Neural Networks"},{"key":"10.1016\/S1874-5946(98)80068-0_bib23","series-title":"Proceedings of the 1994 IEEE International Conference on Neural Networks","first-page":"113","article-title":"Weight initialization of MLP classifiers using boundary-preserving patterns","author":"Kaylani","year":"1994"},{"key":"10.1016\/S1874-5946(98)80068-0_bib24","first-page":"1701","article-title":"Initializing weights to a hidden layer of a multilayer neural network by linear programming","volume":"Vol. 2","author":"Kim","year":"1993"},{"key":"10.1016\/S1874-5946(98)80068-0_bib25","first-page":"580","article-title":"Acceleration of back propagations through initial weights pretraining with delta rule","volume":"Vol. 1","author":"Li","year":"1993"},{"key":"10.1016\/S1874-5946(98)80068-0_bib26","first-page":"21","article-title":"Improving the learning speed of 2-layer of 2-layer neural networks by choosing initial values of the adaptive weights","volume":"Vol. 3","author":"Nquyen","year":"1990"},{"key":"10.1016\/S1874-5946(98)80068-0_bib27","series-title":"Proceedings of the International Conference on Artificial Neural Networks, ICANN'94","first-page":"577","article-title":"Optimal weight initiazation for neural networks","author":"Rojas","year":"1994"},{"key":"10.1016\/S1874-5946(98)80068-0_bib28","series-title":"Proceedings of the 6th International Conference on Tools with Artificial Intelligence, TAI'94","first-page":"672","article-title":"A weight value initialization method for improving learning performance of the backpropagation algorithm in neural networks","author":"Shimodaira","year":"1994"},{"key":"10.1016\/S1874-5946(98)80068-0_bib29","doi-asserted-by":"crossref","first-page":"899","DOI":"10.1109\/72.165592","article-title":"Avoiding false local minima by proper initialization of connections","volume":"3","author":"Wessels","year":"1992","journal-title":"IEEE Trans. Neural Networks"},{"key":"10.1016\/S1874-5946(98)80068-0_bib30","series-title":"Proceedings of the 1993 International Conference on Systems, Man and Cybernetics","first-page":"584","article-title":"Design and initialization of two-layer perceptrons using standard pattern recognition techniques","author":"Weymaere","year":"1993"},{"key":"10.1016\/S1874-5946(98)80068-0_bib31","author":"Fletcher","year":"1990"},{"key":"10.1016\/S1874-5946(98)80068-0_bib32","series-title":"Proceedings of the IEEE International Conference on Neural Networks","article-title":"A direct adaptive method for faster backpropagation learning: the Rprop algorithm","author":"Riedmiller","year":"1993"},{"key":"10.1016\/S1874-5946(98)80068-0_bib33","article-title":"Advanced supervised learning in multilayer perceptrons\u2014from backpropagation to adaptive learning algorithms. Special Issue on Neural Networks","volume":"5","author":"Riedmiller","year":"1994","journal-title":"Int. J. Comput. Standards Interfaces"},{"key":"10.1016\/S1874-5946(98)80068-0_bib34","series-title":"Proceedings of the 1988 Connectionist Models Summer School","first-page":"133","article-title":"Learning with localized receptive fields","author":"Moody","year":"1988"},{"key":"10.1016\/S1874-5946(98)80068-0_bib35","doi-asserted-by":"crossref","first-page":"281","DOI":"10.1162\/neco.1989.1.2.281","article-title":"Fast learning in networks of locally-tuned processing units","volume":"1","author":"Moody","year":"1989","journal-title":"Neural Comput."},{"key":"10.1016\/S1874-5946(98)80068-0_bib36","author":"Draper","year":"1966"},{"key":"10.1016\/S1874-5946(98)80068-0_bib37","author":"Seber","year":"1977"},{"key":"10.1016\/S1874-5946(98)80068-0_bib38","doi-asserted-by":"crossref","first-page":"982","DOI":"10.1162\/neco.1995.7.5.982","article-title":"Initializing weights of a multilayer perceptron network by using the orthogonal least squares algorithm","volume":"7","author":"Lehtokangas","year":"1995","journal-title":"Neural Comput."},{"key":"10.1016\/S1874-5946(98)80068-0_bib39","series-title":"Proceedings of the European Symposium on Artificial Neural Networks, ESANN'96","first-page":"243","article-title":"Maximum covariance method for weight initialization of multilayer perceptron network","author":"Lehtokangas","year":"1996"},{"key":"10.1016\/S1874-5946(98)80068-0_bib40","doi-asserted-by":"crossref","first-page":"302","DOI":"10.1109\/72.80341","article-title":"Orthogonal least squares learning algorithm for radial basis function networks","volume":"2","author":"Chen","year":"1991","journal-title":"IEEE Trans. Neural Networks"},{"key":"10.1016\/S1874-5946(98)80068-0_bib41","first-page":"378","article-title":"Orthogonal least-squares algorithm for training multioutput radial basis function networks","volume":"139","author":"Chen","year":"1992","journal-title":"IEE Proc. F"},{"key":"10.1016\/S1874-5946(98)80068-0_bib42","series-title":"Proceedings of the International Conference on Neural Networks, ICNN'96","first-page":"176","article-title":"Fast hidden node selection methods for training radial basis function networks. Plenary, panel and special sessions","author":"Lehtokangas","year":"1996"},{"key":"10.1016\/S1874-5946(98)80068-0_bib43","doi-asserted-by":"crossref","first-page":"199","DOI":"10.1109\/5.265347","article-title":"Applications of voice processing to telecommunications","volume":"82","author":"Rabiner","year":"1994","journal-title":"Proc. IEEE"},{"key":"10.1016\/S1874-5946(98)80068-0_bib44","doi-asserted-by":"crossref","first-page":"1214","DOI":"10.1109\/5.237532","article-title":"Signal modeling techniques in speech recognition","volume":"81","author":"Picone","year":"1993","journal-title":"Proc. IEEE"},{"key":"10.1016\/S1874-5946(98)80068-0_bib45","doi-asserted-by":"crossref","first-page":"52","DOI":"10.1109\/TASSP.1986.1164788","article-title":"Speaker independent isolated word recognition using dynamic features of speech spectrum","volume":"34","author":"Furui","year":"1986","journal-title":"IEEE Trans. Acoustic Speech Signal Processing"},{"key":"10.1016\/S1874-5946(98)80068-0_bib46","author":"Kohonen","year":"1995"},{"key":"10.1016\/S1874-5946(98)80068-0_bib47","doi-asserted-by":"crossref","first-page":"541","DOI":"10.1016\/0167-6393(90)90029-9","article-title":"Using self-organizing maps and multi-layered feed-forward nets to obtain phonemic transcription of spoken utterances","volume":"9","author":"Kokkonen","year":"1990","journal-title":"Speech Commun."},{"key":"10.1016\/S1874-5946(98)80068-0_bib48","doi-asserted-by":"crossref","first-page":"2651","DOI":"10.1109\/78.165652","article-title":"A combined self-organizing feature map and multilayer perceptron for isolated word recognition","volume":"40","author":"Zezhen","year":"1992","journal-title":"IEEE Trans. Signal Processing"},{"key":"10.1016\/S1874-5946(98)80068-0_bib49","first-page":"42.11","article-title":"A database of speaker-independent digit recognition","volume":"Vol. 3","author":"Leonard","year":"1984"},{"key":"10.1016\/S1874-5946(98)80068-0_bib50","author":"Kohonen","year":"1995"},{"key":"10.1016\/S1874-5946(98)80068-0_bib51","author":"Math Works Inc.","year":"1994","journal-title":"MATLAB for Windows version 4.2c.1"},{"key":"10.1016\/S1874-5946(98)80068-0_bib52","first-page":"1912","article-title":"Isolated spoken number recognition with hybrid of self-organizing map and multilayer perceptron","volume":"Vol. 4","author":"Salmela","year":"1996"},{"key":"10.1016\/S1874-5946(98)80068-0_bib53","doi-asserted-by":"crossref","first-page":"257","DOI":"10.1007\/BF00332914","article-title":"Accelerating the convergence of the backpropagation method","volume":"59","author":"Vogl","year":"1988","journal-title":"Biological Cybernetics"},{"key":"10.1016\/S1874-5946(98)80068-0_bib54","author":"Haykin","year":"1994"},{"key":"10.1016\/S1874-5946(98)80068-0_bib55","doi-asserted-by":"crossref","first-page":"74","DOI":"10.1049\/ip-cds:19951630","article-title":"A novel technology independent neural network approach on device modelling interface","volume":"142","author":"Ojala","year":"1995","journal-title":"IEEE Proc. G, Circuits, Devices and Systems"},{"key":"10.1016\/S1874-5946(98)80068-0_bib56","article-title":"Proben 1\u2014a set of neural network benchmark problems and benchmarking rules","author":"Prechelt","year":"1994"}],"container-title":["Neural Network Systems Techniques and Applications","Algorithms and Architectures"],"original-title":[],"deposited":{"date-parts":[[2018,12,29]],"date-time":"2018-12-29T21:22:05Z","timestamp":1546118525000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1874594698800680"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1998]]},"references-count":56,"URL":"https:\/\/doi.org\/10.1016\/s1874-5946(98)80068-0","relation":{},"ISSN":["1874-5946"],"issn-type":[{"value":"1874-5946","type":"print"}],"subject":[],"published":{"date-parts":[[1998]]}}}