{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,19]],"date-time":"2026-02-19T02:48:57Z","timestamp":1771469337829,"version":"3.50.1"},"reference-count":21,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,12]]},"DOI":"10.1109\/bigdata.2016.7840590","type":"proceedings-article","created":{"date-parts":[[2017,2,7]],"date-time":"2017-02-07T16:46:59Z","timestamp":1486486019000},"page":"66-75","source":"Crossref","is-referenced-by-count":24,"title":["Predicting statistics of asynchronous SGD parameters for a large-scale distributed deep learning system on GPU supercomputers"],"prefix":"10.1109","author":[{"given":"Yosuke","family":"Oyama","sequence":"first","affiliation":[]},{"given":"Akihiro","family":"Nomura","sequence":"additional","affiliation":[]},{"given":"Ikuro","family":"Sato","sequence":"additional","affiliation":[]},{"given":"Hiroki","family":"Nishimura","sequence":"additional","affiliation":[]},{"given":"Yukimasa","family":"Tamatsu","sequence":"additional","affiliation":[]},{"given":"Satoshi","family":"Matsuoka","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","article-title":"Staleness-aware async-sgd for distributed deep learning","author":"zhang","year":"2015","journal-title":"arXiv preprint arXiv 1511 05271"},{"key":"ref11","article-title":"Distributed asynchronous optimization of convolutional neural networks","author":"chan","year":"0","journal-title":"Proc INTERSPEECH 2014"},{"key":"ref12","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2014","journal-title":"arXiv preprint arXiv 1409 1556"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/2783258.2783270"},{"key":"ref14","first-page":"571","article-title":"Project adam: Building an efficient and scalable deep learning training system","author":"chilimbi","year":"2014","journal-title":"11 th USENIX Symposium on Operating Systems Design and Implementation (OSDI 14)"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref16","first-page":"2121","article-title":"Adaptive subgradient methods for online learning and stochastic optimization","volume":"12","author":"duchi","year":"2011","journal-title":"J Mach Learn Res"},{"key":"ref17","first-page":"1","article-title":"Rectifier nonlinearities improve neural network acoustic models","volume":"30","author":"maas","year":"2013","journal-title":"Proc ICML"},{"key":"ref18","article-title":"Highway networks","author":"srivastava","year":"2015","journal-title":"arXiv preprint arXiv 1505 03561"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"ref4","article-title":"Deep speech 2: End-to-end speech recognition in english and mandarin","author":"amodei","year":"2015","journal-title":"arXiv preprint arXiv 1512 00327"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.123"},{"key":"ref6","article-title":"One weird trick for parallelizing convolutional neural networks","author":"krizhevsky","year":"2014","journal-title":"arXiv preprint arXiv 1404 5997"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6638950"},{"key":"ref8","article-title":"Firecaffe: near-linear acceleration of deep neural network training on compute clusters","author":"iandola","year":"2015","journal-title":"arXiv preprint arXiv 1511 05271"},{"key":"ref7","first-page":"1232","article-title":"Large scale distributed deep networks","author":"dean","year":"2012","journal-title":"Advances in Neural Information Processing Systems 25"},{"key":"ref2","article-title":"Deep image: Scaling up image recognition","volume":"7","author":"wu","year":"2015","journal-title":"arXiv preprint arXiv 1501 02876"},{"key":"ref1","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Advances in Neural Information Processing Systems 25"},{"key":"ref9","article-title":"Model accuracy and runtime tradeoff in distributed deep learning","author":"gupta","year":"2015","journal-title":"arXiv preprint arXiv 1509 04210"},{"key":"ref20","article-title":"Notes on convolutional neural networks","author":"bouvrie","year":"2006"},{"key":"ref21","first-page":"1737","article-title":"Deep learning with limited numerical precision","author":"gupta","year":"2015","journal-title":"Proceedings of the 32nd International Conference on Machine Learning (ICML-15)"}],"event":{"name":"2016 IEEE International Conference on Big Data (Big Data)","location":"Washington DC,USA","start":{"date-parts":[[2016,12,5]]},"end":{"date-parts":[[2016,12,8]]}},"container-title":["2016 IEEE International Conference on Big Data (Big Data)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7818133\/7840573\/07840590.pdf?arnumber=7840590","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,3,1]],"date-time":"2017-03-01T17:42:15Z","timestamp":1488390135000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7840590\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,12]]},"references-count":21,"URL":"https:\/\/doi.org\/10.1109\/bigdata.2016.7840590","relation":{},"subject":[],"published":{"date-parts":[[2016,12]]}}}