{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,28]],"date-time":"2025-09-28T20:34:27Z","timestamp":1759091667794,"version":"3.40.4"},"publisher-location":"Berlin, Heidelberg","reference-count":35,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642352881"},{"type":"electronic","value":"9783642352898"}],"license":[{"start":{"date-parts":[[2012,1,1]],"date-time":"2012-01-01T00:00:00Z","timestamp":1325376000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012]]},"DOI":"10.1007\/978-3-642-35289-8_31","type":"book-chapter","created":{"date-parts":[[2012,11,14]],"date-time":"2012-11-14T12:03:17Z","timestamp":1352894597000},"page":"581-598","source":"Crossref","is-referenced-by-count":24,"title":["Deep Big Multilayer Perceptrons for Digit Recognition"],"prefix":"10.1007","author":[{"given":"Dan Claudiu","family":"Cire\u015fan","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ueli","family":"Meier","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Luca Maria","family":"Gambardella","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"J\u00fcrgen","family":"Schmidhuber","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"31_CR1","doi-asserted-by":"crossref","unstructured":"Bengio, Y., Lamblin, P., Popovici, D., Larochelle, H.: Greedy layer-wise training of deep networks. In: Neural Information Processing Systems (2006)","DOI":"10.7551\/mitpress\/7503.003.0024"},{"key":"31_CR2","unstructured":"Bishop, C.M.: Pattern Recognition and Machine Learning. Springer (2006)"},{"key":"31_CR3","first-page":"123","volume":"24","author":"L. Breiman","year":"1996","unstructured":"Breiman, L.: Bagging predictors. Machine Learning\u00a024, 123\u2013140 (1996)","journal-title":"Machine Learning"},{"key":"31_CR4","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"358","DOI":"10.1007\/11669487_32","volume-title":"Document Analysis Systems VII","author":"K. Chellapilla","year":"2006","unstructured":"Chellapilla, K., Shilman, M., Simard, P.: Combining Multiple Classifiers for Faster Optical Character Recognition. In: Bunke, H., Spitz, A.L. (eds.) DAS 2006. LNCS, vol.\u00a03872, pp. 358\u2013367. Springer, Heidelberg (2006)"},{"key":"31_CR5","unstructured":"Chellapilla, K., Puri, S., Simard, P.: High performance convolutional neural networks for document processing. In: International Workshop on Frontiers in Handwriting Recognition (2006)"},{"issue":"12","key":"31_CR6","doi-asserted-by":"publisher","first-page":"3207","DOI":"10.1162\/NECO_a_00052","volume":"22","author":"D.C. Ciresan","year":"2010","unstructured":"Ciresan, D.C., Meier, U., Gambardella, L.M., Schmidhuber, J.: Deep, big, simple neural nets for handwritten digit recognition. Neural Computation\u00a022(12), 3207\u20133220 (2010)","journal-title":"Neural Computation"},{"key":"31_CR7","unstructured":"Ciresan, D.C., Meier, U., Gambardella, L.M., Schmidhuber, J.: Handwritten Digit Recognition with a Committee of Deep Neural Nets on GPUs. Technical Report IDSIA-03-11, Istituto Dalle Molle di Studi sull\u2019Intelligenza Artificiale, IDSIA (2011)"},{"key":"31_CR8","doi-asserted-by":"crossref","unstructured":"Ciresan, D.C., Meier, U., Gambardella, L.M., Schmidhuber, J.: Convolutional neural network committees for handwritten character recognition. In: International Conference on Document Analysis and Recognition, pp. 1135\u20131139 (2011)","DOI":"10.1109\/ICDAR.2011.229"},{"key":"31_CR9","doi-asserted-by":"crossref","unstructured":"Ciresan, D.C., Meier, U., Masci, J., Schmidhuber, J.: A committee of neural networks for traffic sign classification. In: International Joint Conference on Neural Networks, pp. 1918\u20131921 (2011)","DOI":"10.1109\/IJCNN.2011.6033458"},{"key":"31_CR10","unstructured":"Ciresan, D.C., Meier, U., Masci, J., Gambardella, L.M., Schmidhuber, J.: Flexible, high performance convolutional neural networks for image classification. In: International Joint Conference on Artificial Intelligence, pp. 1237\u20131242 (2011)"},{"key":"31_CR11","doi-asserted-by":"crossref","unstructured":"Ciresan, D.C., Meier, U., Schmidhuber, J.: Multi-column deep neural networks for image classification. In: Computer Vision and Pattern Recognition, pp. 3642\u20133649 (2012)","DOI":"10.1109\/CVPR.2012.6248110"},{"key":"31_CR12","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1016\/j.neunet.2012.02.023","volume":"32","author":"D.C. Ciresan","year":"2012","unstructured":"Ciresan, D.C., Meier, U., Masci, J., Schmidhuber, J.: Multi-column deep neural network for traffic sign classification. Neural Networks\u00a032, 333\u2013338 (2012)","journal-title":"Neural Networks"},{"key":"31_CR13","doi-asserted-by":"crossref","unstructured":"Decoste, D., Scholkopf, B.: Training invariant support vector machines. Machine Learning\u00a0(46), 161\u2013190 (2002)","DOI":"10.1023\/A:1012454411458"},{"key":"31_CR14","doi-asserted-by":"crossref","unstructured":"Hinton, G.E., Salakhutdinov, R.R.: Reducing the dimensionality of data with neural networks. Science 313 (2006)","DOI":"10.1126\/science.1127647"},{"key":"31_CR15","doi-asserted-by":"crossref","unstructured":"Hinton, G.E.: To recognize shapes, first learn to generate images. Computational Neuroscience: Theoretical Insights into Brain Function (2007)","DOI":"10.1016\/S0079-6123(06)65034-6"},{"key":"31_CR16","unstructured":"Hochreiter, S.: Untersuchungen zu dynamischen neuronalen Netzen. Diploma thesis, Institut f\u00fcr Informatik, Lehrstuhl Prof. Brauer, Technische Universit\u00e4t M\u00fcnchen (1991), http:\/\/www7.informatik.tu-muenchen.de\/~hochreit ; advisor: J. Schmidhuber"},{"key":"31_CR17","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S. Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J.: Long short-term memory. Neural Computation\u00a09, 1735\u20131780 (1997)","journal-title":"Neural Computation"},{"key":"31_CR18","unstructured":"Hochreiter, S., Bengio, Y., Frasconi, P., Schmidhuber, J.: Gradient flow in recurrent nets: the difficulty of learning long-term dependencies. In: Kremer, S.C., Kolen, J.F. (eds.) A Field Guide to Dynamical Recurrent Neural Networks. IEEE Press (2001)"},{"key":"31_CR19","doi-asserted-by":"crossref","unstructured":"Lauer, F., Suen, C., Bloch, G.: A trainable feature extractor for handwritten digit recognition. Pattern Recognition (40), 1816\u20131824 (2007)","DOI":"10.1016\/j.patcog.2006.10.011"},{"key":"31_CR20","unstructured":"LeCun, Y.: Une proc\u00e9dure d\u2019apprentissage pour r\u00e9seau a seuil asymmetrique (a learning scheme for asymmetric threshold networks). In: Proceedings of Cognitiva 1985, Paris, France, pp. 599\u2013604 (1985)"},{"issue":"11","key":"31_CR21","doi-asserted-by":"publisher","first-page":"2278","DOI":"10.1109\/5.726791","volume":"86","author":"Y. LeCun","year":"1998","unstructured":"LeCun, Y., Bottou, L., Bengio, Y., Haffner, P.: Gradient-based learning applied to document recognition. Proceedings of the IEEE\u00a086(11), 2278\u20132324 (1998)","journal-title":"Proceedings of the IEEE"},{"key":"31_CR22","doi-asserted-by":"crossref","unstructured":"Meier, U., Ciresan, D.C., Gambardella, L.M., Schmidhuber, J.: Better digit recognition with a committee of simple neural nets. In: ICDAR, pp. 1135\u20131139 (2011)","DOI":"10.1109\/ICDAR.2011.252"},{"key":"31_CR23","unstructured":"Mohamed, A., Dahl, G., Hinton, G.E.: Deep belief networks for phone recognition. In: Proc. of NIPS 2009 Workshop on Deep Learning for Speech Recognition and Related Applications (2009)"},{"key":"31_CR24","unstructured":"Nair, V., Hinton, G.E.: 3D object recognition with deep belief nets. In: Advances in Neural Information Processing Systems (2009)"},{"key":"31_CR25","unstructured":"NVIDIA: NVIDIA CUDA. Reference Manual, vol. 2.3. NVIDIA (2009)"},{"key":"31_CR26","doi-asserted-by":"crossref","unstructured":"Ranzato, M., Poultney, C., Chopra, S., LeCun, Y.: Efficient learning of sparse representations with an energy-based model. In: Platt, J., et al. (eds.) Advances in Neural Information Processing Systems (NIPS 2006). MIT Press (2006)","DOI":"10.7551\/mitpress\/7503.003.0147"},{"key":"31_CR27","doi-asserted-by":"crossref","unstructured":"Ranzato, M.: Fu Jie Huang, Y.L.B., LeCun, Y.: Unsupervised learning of invariant feature hierarchies with applications to object recognition. In: Proc. of Computer Vision and Pattern Recognition Conference (2007)","DOI":"10.1109\/CVPR.2007.383157"},{"key":"31_CR28","unstructured":"Ruetsch, G., Micikevicius, P.: Optimizing matrix transpose in cuda. In: NVIDIA GPU Computing SDK, pp. 1\u20132 (2009)"},{"key":"31_CR29","doi-asserted-by":"crossref","first-page":"318","DOI":"10.7551\/mitpress\/5236.001.0001","volume-title":"Parallel Distributed Processing: Explorations in the Microstructure of Cognition","author":"D.E. Rumelhart","year":"1986","unstructured":"Rumelhart, D.E., Hinton, G.E., Williams, R.J.: Learning internal representations by error propagation. In: Parallel Distributed Processing: Explorations in the Microstructure of Cognition, vol.\u00a01: Foundations, pp. 318\u2013362. MIT Press, Cambridge (1986)"},{"key":"31_CR30","volume-title":"Artificial Intelligence: A Modern Approach","author":"S. Russell","year":"2003","unstructured":"Russell, S., Norvig, P.: Artificial Intelligence: A Modern Approach, 2nd edn. Prentice-Hall, Englewood Cliffs (2003)","edition":"2"},{"key":"31_CR31","unstructured":"Salakhutdinov, R., Hinton, G.: Learning a nonlinear embedding by preserving class neighborhood structure. In: Proc. of the International Conference on Artificial Intelligence and Statistics, vol.\u00a011 (2007)"},{"key":"31_CR32","doi-asserted-by":"crossref","unstructured":"Scherer, D., Behnke, S.: Accelerating large-scale convolutional neural networks with parallel graphics multiprocessors. In: Proc. of NIPS 2009 Workshop on Large-Scale Machine Learning: Parallelism and Massive Datasets (2009)","DOI":"10.1007\/978-3-642-15825-4_9"},{"key":"31_CR33","doi-asserted-by":"crossref","unstructured":"Simard, P., Steinkraus, D., Platt, J.C.: Best practices for convolutional neural networks applied to visual document analysis. In: Seventh International Conference on Document Analysis and Recognition, pp. 958\u2013963 (2003)","DOI":"10.1109\/ICDAR.2003.1227801"},{"key":"31_CR34","doi-asserted-by":"crossref","unstructured":"Steinkraus, D., Simard, P.Y.: Gpus for machine learning algorithms. In: International Conference on Document Analysis and Recognition, pp. 1115\u20131120 (2005)","DOI":"10.1109\/ICDAR.2005.251"},{"key":"31_CR35","unstructured":"Werbos, P.J.: Beyond Regression: New Tools for Prediction and Analysis in the Behavioral Sciences. PhD thesis, Harvard University (1974)"}],"container-title":["Lecture Notes in Computer Science","Neural Networks: Tricks of the Trade"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-35289-8_31","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,20]],"date-time":"2025-04-20T21:28:31Z","timestamp":1745184511000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-35289-8_31"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012]]},"ISBN":["9783642352881","9783642352898"],"references-count":35,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-35289-8_31","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2012]]}}}