{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,15]],"date-time":"2025-05-15T04:47:14Z","timestamp":1747284434516,"version":"3.28.0"},"reference-count":33,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014,7]]},"DOI":"10.1109\/ijcnn.2014.6889433","type":"proceedings-article","created":{"date-parts":[[2014,9,10]],"date-time":"2014-09-10T10:30:33Z","timestamp":1410345033000},"page":"4062-4069","source":"Crossref","is-referenced-by-count":46,"title":["Large scale recurrent neural network on GPU"],"prefix":"10.1109","author":[{"given":"Boxun","family":"Li","sequence":"first","affiliation":[]},{"given":"Erjin","family":"Zhou","sequence":"additional","affiliation":[]},{"given":"Bo","family":"Huang","sequence":"additional","affiliation":[]},{"given":"Jiayi","family":"Duan","sequence":"additional","affiliation":[]},{"given":"Yu","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Ningyi","family":"Xu","sequence":"additional","affiliation":[]},{"given":"Jiaxing","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Huazhong","family":"Yang","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"19","volume":"2","author":"jurafsky","year":"0","journal-title":"Speech and Language Processing An Introduction to Natural Language Processing Computational Linguistics and Speech Recognition"},{"key":"17","first-page":"265","article-title":"On optimization methods for deep learning","author":"ngiam","year":"2011","journal-title":"Proceedings of the 28th International Conference on Machine Learning (ICML-11)"},{"key":"18","article-title":"A guide to recurrent neural networks and backpropagation","author":"bod\u00e9n","year":"2002","journal-title":"Dallas Project SICS Technical Report"},{"key":"33","first-page":"2265","article-title":"Learning word embeddings efficiently with 
noise-contrastive estimation","author":"mnih","year":"2013","journal-title":"NIPS"},{"key":"15","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO.2007.30"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553486"},{"journal-title":"On the Difficulty of Training Recurrent Neural Networks","year":"2012","author":"pascanu","key":"13"},{"key":"14","first-page":"1337","article-title":"Deep learning with cots hpc systems","volume":"28","author":"coates","year":"2013","journal-title":"Proceedings of the 30th International Conference on Machine Learning (ICML-13)"},{"key":"11","first-page":"1033","article-title":"Learning recurrent neural networks with hessian-free optimization","author":"martens","year":"2011","journal-title":"Proceedings of the 28th International Conference on Machine Learning (ICML-11)"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2011.6163930"},{"journal-title":"Statistical Methods for Speech Recognition","year":"1997","author":"jelinek","key":"21"},{"key":"20","first-page":"258","article-title":"Faster and smaller n-gram language models","author":"pauls","year":"2011","journal-title":"ACL"},{"key":"22","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2011.5947611"},{"key":"23","doi-asserted-by":"crossref","first-page":"1045","DOI":"10.21437\/Interspeech.2010-343","article-title":"Recurrent neural network based language model","author":"mikolov","year":"2010","journal-title":"InterSpeech"},{"journal-title":"Intel Math Kernel Library","year":"0","author":"intel","key":"24"},{"key":"25","article-title":"Cublas library","volume":"15","author":"nvidia","year":"2008","journal-title":"NVIDIA Corporation Santa Clara California"},{"key":"26","first-page":"16","article-title":"Rnnlm-recurrent neural network language modeling toolkit","author":"mikolov","year":"2011","journal-title":"Proc IEEE Workshop on Automatic Speech Recognition and 
Understanding"},{"key":"27","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2008.5214359"},{"key":"28","doi-asserted-by":"publisher","DOI":"10.1145\/2155620.2155656"},{"journal-title":"GPU Computing SDK","year":"0","author":"nvidia","key":"29"},{"key":"3","doi-asserted-by":"crossref","first-page":"267","DOI":"10.1016\/j.future.2009.01.001","article-title":"Study of neural net training methods in parallel and distributed architectures","volume":"26","author":"men\u00e9ndez de llano","year":"2010","journal-title":"Future Generation Computer Systems"},{"journal-title":"Modern Nonparametric Methods in Machine Learning","year":"0","author":"n workshop","key":"2"},{"key":"10","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2007.370428"},{"key":"1","first-page":"24","article-title":"Are you ready for the era of big data?","volume":"4","author":"brown","year":"2011","journal-title":"McKinsey Quarterly"},{"key":"30","first-page":"313","article-title":"Building a large annotated corpus of english: The penn treebank","volume":"19","author":"marcus","year":"1993","journal-title":"Computational Linguistics"},{"key":"7","first-page":"1017","article-title":"Generating text with recurrent neural networks","author":"sutskever","year":"2011","journal-title":"Proceedings of the 28th International Conference on Machine Learning (ICML-11)"},{"key":"6","doi-asserted-by":"publisher","DOI":"10.1145\/2505515.2514699"},{"journal-title":"Statistical Language Models Based on Neural Networks","year":"2012","author":"mikolov","key":"32"},{"key":"5","article-title":"Large scale distributed deep networks","author":"dean","year":"2012","journal-title":"NIPS"},{"key":"31","first-page":"29","article-title":"A challenge set for advancing language modeling","author":"zweig","year":"2012","journal-title":"NAACL-HLT 2012 Workshop Will We Ever Really Replace the N-gram Model? 
on the Future of Language Modeling for HLT"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-7012(00)00201-3"},{"key":"9","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6639345"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1989.1.2.270"}],"event":{"name":"2014 International Joint Conference on Neural Networks (IJCNN)","start":{"date-parts":[[2014,7,6]]},"location":"Beijing, China","end":{"date-parts":[[2014,7,11]]}},"container-title":["2014 International Joint Conference on Neural Networks (IJCNN)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6880678\/6889358\/06889433.pdf?arnumber=6889433","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,4,16]],"date-time":"2022-04-16T15:45:21Z","timestamp":1650123921000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/6889433"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,7]]},"references-count":33,"URL":"https:\/\/doi.org\/10.1109\/ijcnn.2014.6889433","relation":{},"subject":[],"published":{"date-parts":[[2014,7]]}}}