{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T18:45:09Z","timestamp":1772822709905,"version":"3.50.1"},"reference-count":21,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,12]]},"DOI":"10.1109\/icpr.2016.7900183","type":"proceedings-article","created":{"date-parts":[[2017,4,24]],"date-time":"2017-04-24T17:12:47Z","timestamp":1493053967000},"page":"3542-3547","source":"Crossref","is-referenced-by-count":16,"title":["Faster training of very deep networks via p-norm gates"],"prefix":"10.1109","author":[{"given":"Trang","family":"Pham","sequence":"first","affiliation":[]},{"given":"Truyen","family":"Tran","sequence":"additional","affiliation":[]},{"given":"Dinh","family":"Phung","sequence":"additional","affiliation":[]},{"given":"Svetha","family":"Venkatesh","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","first-page":"1319","article-title":"Maxout networks","author":"goodfellow","year":"2013","journal-title":"Proceedings of The 30th InternationalConference on Machine Learning"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref12","article-title":"Generating sequences with recurrent neural networks","author":"graves","year":"2013","journal-title":"arXiv preprint arXiv 1308 0850"},{"key":"ref13","first-page":"2368","article-title":"Training very deep networks","author":"srivastava","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref14","article-title":"Deep residual learning for image recognition","author":"he","year":"2015","journal-title":"arXiv preprint arXiv 1512 03385"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/W14-4012"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1179"},{"key":"ref17","article-title":"Empirical evaluation of gated recurrent neural networks on sequence modeling","author":"chung","year":"2014","journal-title":"arXiv preprint arXiv 1412 3555"},{"key":"ref18","author":"mikolov","year":"2012","journal-title":"Subword language modeling with neural networks"},{"key":"ref19","article-title":"Character-aware neural language models","author":"kim","year":"2015","journal-title":"arXiv preprint arXiv 1508 06615"},{"key":"ref4","article-title":"Ask me anything: Dynamic memory networks for natural language processing","author":"kumar","year":"2015","journal-title":"arXiv preprint arXiv 1506 01070"},{"key":"ref3","first-page":"3104","article-title":"Sequence to sequence learning with neural networks","author":"sutskever","year":"2014","journal-title":"Advances in neural information processing systems"},{"key":"ref6","first-page":"192","article-title":"The loss surfaces of multilayer networks","author":"choromanska","year":"2015","journal-title":"International Conference on Artificial Intelligence and Statistics"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1561\/2200000006"},{"key":"ref8","article-title":"Gradient flow in recurrent nets: the difficulty of learning long-term dependencies","author":"hochreiter","year":"2001","journal-title":"A Field Guide to Dynamical Recurrent Neural Networks"},{"key":"ref7","first-page":"1","article-title":"Exploring strategies for training deep neural networks","volume":"10","author":"larochelle","year":"2009","journal-title":"The Journal of Machine Learning Research"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2205597"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.123"},{"key":"ref9","first-page":"315","article-title":"Deep sparse rectifier networks","volume":"15","author":"glorot","year":"2011","journal-title":"Proceedings of the 14th InternationalConference on Artificial Intelligence and Statistics JMLR W&CP Volume"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-31750-2_3"},{"key":"ref21","article-title":"Regularizing RNNs by Stabilizing Activations","author":"krueger","year":"2015","journal-title":"arXiv preprint arXiv 1511 05271"}],"event":{"name":"2016 23rd International Conference on Pattern Recognition (ICPR)","location":"Cancun","start":{"date-parts":[[2016,12,4]]},"end":{"date-parts":[[2016,12,8]]}},"container-title":["2016 23rd International Conference on Pattern Recognition (ICPR)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7893644\/7899596\/07900183.pdf?arnumber=7900183","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,12,13]],"date-time":"2017-12-13T15:17:13Z","timestamp":1513178233000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7900183\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,12]]},"references-count":21,"URL":"https:\/\/doi.org\/10.1109\/icpr.2016.7900183","relation":{},"subject":[],"published":{"date-parts":[[2016,12]]}}}