{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,19]],"date-time":"2025-09-19T09:22:08Z","timestamp":1758273728527,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":31,"publisher":"ACM","license":[{"start":{"date-parts":[[2019,7,25]],"date-time":"2019-07-25T00:00:00Z","timestamp":1564012800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["1546459"],"award-info":[{"award-number":["1546459"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2019,7,25]]},"DOI":"10.1145\/3292500.3330837","type":"proceedings-article","created":{"date-parts":[[2019,7,26]],"date-time":"2019-07-26T13:17:26Z","timestamp":1564147046000},"page":"1460-1470","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["Scaling Multinomial Logistic Regression via Hybrid Parallelism"],"prefix":"10.1145","author":[{"given":"Parameswaran","family":"Raman","sequence":"first","affiliation":[{"name":"University of California Santa Cruz, Santa Cruz, CA, USA"}]},{"given":"Sriram","family":"Srinivasan","sequence":"additional","affiliation":[{"name":"University of California Santa Cruz, Santa Cruz, CA, USA"}]},{"given":"Shin","family":"Matsushima","sequence":"additional","affiliation":[{"name":"University of Tokyo, Tokyo, Japan"}]},{"given":"Xinhua","family":"Zhang","sequence":"additional","affiliation":[{"name":"University of Illinios Chicago, Chicago, IL, USA"}]},{"given":"Hyokun","family":"Yun","sequence":"additional","affiliation":[{"name":"Amazon, Seattle, WA, USA"}]},{"given":"S.V.N.","family":"Vishwanathan","sequence":"additional","affiliation":[{"name":"Amazon, Palo Alto, CA, USA"}]}],"member":"320","published-online":{"date-parts":[[2019,7,25]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/2488388.2488391"},{"key":"e_1_3_2_1_2_1","first-page":"1","article-title":"Incremental gradient, subgradient, and proximal methods for convex optimization: A survey","author":"Bertsekas D. P.","year":"2010","journal-title":"Optimization for Machine Learning"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-7908-2604-3_16"},{"volume-title":"Efficient bounds for the softmax function, applications to inference in hybrid models","year":"2007","author":"Bouchard G.","key":"e_1_3_2_1_4_1"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1561\/2200000016"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.5555\/993483"},{"key":"e_1_3_2_1_7_1","first-page":"281","volume-title":"Advances in neural information processing systems","author":"Chu C.-T.","year":"2007"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/1864708.1864770"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/2020408.2020426"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.5555\/3086952"},{"key":"e_1_3_2_1_11_1","first-page":"289","volume-title":"Proceedings of the 30th International Conference on Machine Learning (ICML-13)","author":"Gopal S.","year":"2013"},{"volume-title":"Random shuffling beats sgd after finite epochs. arXiv preprint arXiv:1806.10077","year":"2018","author":"HaoChen J. Z.","key":"e_1_3_2_1_12_1"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939756"},{"volume-title":"Big Learning NIPS Workshop","year":"2013","author":"Li M.","key":"e_1_3_2_1_14_1"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4757-6594-6_11"},{"volume-title":"Introductory lectures on convex optimization: A basic course","year":"2013","author":"Nesterov Y.","key":"e_1_3_2_1_16_1"},{"key":"e_1_3_2_1_17_1","series-title":"Springer Series in Operations Research","volume-title":"Numerical Optimization","author":"Nocedal J.","year":"2006","edition":"2"},{"key":"e_1_3_2_1_18_1","first-page":"693","volume-title":"Advances in Neural Information Processing Systems","author":"Recht B.","year":"2011"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177729586"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"e_1_3_2_1_21_1","first-page":"46","volume-title":"Advances in Neural Information Processing Systems","author":"Shamir O.","year":"2016"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/2987550.2987586"},{"volume-title":"Dscovr: Randomized primal-dual block coordinate algorithms for asynchronous distributed optimization. arXiv preprint arXiv:1710.05080","year":"2017","author":"Xiao L.","key":"e_1_3_2_1_23_1"},{"volume-title":"CoRR","year":"2015","author":"Xie P.","key":"e_1_3_2_1_24_1"},{"key":"e_1_3_2_1_25_1","article-title":"Petuum: a new platform for distributed machine learning on big data. Big Data","author":"Xing E. P.","year":"2015","journal-title":"IEEE Transactions on"},{"key":"e_1_3_2_1_26_1","first-page":"3069","volume-title":"Proceedings of The 33rd International Conference on Machine Learning","author":"Yen I. E.-H.","year":"2016"},{"volume-title":"Advances in Neural Information Processing Systems","year":"2014","author":"Yun H.","key":"e_1_3_2_1_28_1"},{"volume-title":"Nomad: Non-locking, stochastic multi-machine algorithm for asynchronous and decentralized matrix completion","year":"2013","author":"Yun H.","key":"e_1_3_2_1_29_1"},{"volume-title":"Taming convergence for asynchronous stochastic gradient descent with unbounded delay in non-convex learning. arXiv preprint arXiv:1805.09470","year":"2018","author":"Zhang X.","key":"e_1_3_2_1_30_1"},{"volume-title":"A fast parallel stochastic gradient method for matrix factorization in shared memory systems","year":"2013","author":"Zhuang Y.","key":"e_1_3_2_1_31_1"},{"key":"e_1_3_2_1_32_1","first-page":"2595","volume-title":"Advances in Neural Information Processing Systems","author":"Zinkevich M.","year":"2010"}],"event":{"name":"KDD '19: The 25th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"],"location":"Anchorage AK USA","acronym":"KDD '19"},"container-title":["Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery &amp; Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3292500.3330837","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3292500.3330837","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3292500.3330837","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T00:26:02Z","timestamp":1750206362000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3292500.3330837"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,7,25]]},"references-count":31,"alternative-id":["10.1145\/3292500.3330837","10.1145\/3292500"],"URL":"https:\/\/doi.org\/10.1145\/3292500.3330837","relation":{},"subject":[],"published":{"date-parts":[[2019,7,25]]},"assertion":[{"value":"2019-07-25","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}