{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,28]],"date-time":"2026-02-28T07:35:36Z","timestamp":1772264136427,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":31,"publisher":"ACM","license":[{"start":{"date-parts":[[2019,7,25]],"date-time":"2019-07-25T00:00:00Z","timestamp":1564012800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2019,7,25]]},"DOI":"10.1145\/3292500.3330765","type":"proceedings-article","created":{"date-parts":[[2019,7,26]],"date-time":"2019-07-26T13:17:26Z","timestamp":1564147046000},"page":"2232-2240","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":141,"title":["FDML"],"prefix":"10.1145","author":[{"given":"Yaochen","family":"Hu","sequence":"first","affiliation":[{"name":"University of Alberta, Edmonton, Canada"}]},{"given":"Di","family":"Niu","sequence":"additional","affiliation":[{"name":"University of Alberta, Edmonton, Canada"}]},{"given":"Jianming","family":"Yang","sequence":"additional","affiliation":[{"name":"Tencent, Shenzhen, China"}]},{"given":"Shengping","family":"Zhou","sequence":"additional","affiliation":[{"name":"Tencent, Shenzhen, China"}]}],"member":"320","published-online":{"date-parts":[[2019,7,25]]},"reference":[{"key":"e_1_3_2_2_1_1","volume-title":"Proc. USENIX Symposium on Operating System Design and Implementation (OSDI) .","author":"Abadi Mart'in","year":"2016"},{"key":"e_1_3_2_2_2_1","volume-title":"Demystifying Parallel and Distributed Deep Learning: An In-Depth Concurrency Analysis. arXiv preprint arXiv:1802.09941","author":"Ben-Nun Tal","year":"2018"},{"key":"e_1_3_2_2_4_1","volume-title":"Parallel coordinate descent for l1-regularized loss minimization. arXiv preprint arXiv:1105.5379","author":"Bradley Joseph K","year":"2011"},{"key":"e_1_3_2_2_5_1","first-page":"571","article-title":"Project Adam: Building an Efficient and Scalable Deep Learning Training System","volume":"14","author":"Chilimbi Trishul M","year":"2014","journal-title":"OSDI"},{"key":"e_1_3_2_2_6_1","volume-title":"et almbox","author":"Dean Jeffrey","year":"2012"},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"publisher","DOI":"10.5555\/2503308.2188391"},{"key":"e_1_3_2_2_8_1","unstructured":"Dua Dheeru and Efi Karra Taniskidou. 2017. UCI Machine Learning Repository. http:\/\/archive.ics.uci.edu\/ml  Dua Dheeru and Efi Karra Taniskidou. 2017. UCI Machine Learning Repository. http:\/\/archive.ics.uci.edu\/ml"},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.5555\/1791834.1791836"},{"key":"e_1_3_2_2_10_1","doi-asserted-by":"publisher","DOI":"10.1561\/0400000042"},{"key":"e_1_3_2_2_11_1","volume-title":"International Conference on Machine Learning . 201--210","author":"Gilad-Bachrach Ran","year":"2016"},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/3133956.3134012"},{"key":"e_1_3_2_2_13_1","volume-title":"Phillip B Gibbons, Garth A Gibson, Greg Ganger, and Eric P Xing.","author":"Ho Qirong","year":"2013"},{"key":"e_1_3_2_2_14_1","volume-title":"Gaia: Geo-Distributed Machine Learning Approaching LAN Speeds.. In NSDI. 629--647.","author":"Hsieh Kevin","year":"2017"},{"key":"e_1_3_2_2_15_1","first-page":"2331","article-title":"Slow learners are fast","volume":"22","author":"Langford John","year":"2009","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_2_16_1","volume-title":"Xun Zheng, Qirong Ho, Garth A Gibson, and Eric P Xing.","author":"Lee Seunghak","year":"2014"},{"key":"e_1_3_2_2_17_1","doi-asserted-by":"publisher","DOI":"10.5555\/2685048.2685095"},{"key":"e_1_3_2_2_18_1","unstructured":"Mu Li David G Andersen Alexander J Smola and Kai Yu. 2014b. Communication efficient distributed machine learning with the parameter server. In Advances in Neural Information Processing Systems. 19--27.   Mu Li David G Andersen Alexander J Smola and Kai Yu. 2014b. Communication efficient distributed machine learning with the parameter server. In Advances in Neural Information Processing Systems. 19--27."},{"key":"e_1_3_2_2_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/2835776.2835781"},{"key":"e_1_3_2_2_20_1","unstructured":"Xiangru Lian Yijun Huang Yuncheng Li and Ji Liu. 2015. Asynchronous parallel stochastic gradient for nonconvex optimization. In Advances in Neural Information Processing Systems. 2737--2745.   Xiangru Lian Yijun Huang Yuncheng Li and Ji Liu. 2015. Asynchronous parallel stochastic gradient for nonconvex optimization. In Advances in Neural Information Processing Systems. 2737--2745."},{"key":"e_1_3_2_2_21_1","volume-title":"et almbox","author":"McMahan H Brendan","year":"2016"},{"key":"e_1_3_2_2_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/SP.2017.12"},{"key":"e_1_3_2_2_23_1","unstructured":"Manas Pathak Shantanu Rane and Bhiksha Raj. 2010. Multiparty differential privacy via aggregation of locally trained classifiers. In Advances in Neural Information Processing Systems. 1876--1884.   Manas Pathak Shantanu Rane and Bhiksha Raj. 2010. Multiparty differential privacy via aggregation of locally trained classifiers. In Advances in Neural Information Processing Systems. 1876--1884."},{"key":"e_1_3_2_2_24_1","unstructured":"Arun Rajkumar and Shivani Agarwal. 2012. A differentially private stochastic gradient descent algorithm for multiparty classification. In Artificial Intelligence and Statistics . 933--941.  Arun Rajkumar and Shivani Agarwal. 2012. A differentially private stochastic gradient descent algorithm for multiparty classification. In Artificial Intelligence and Statistics . 933--941."},{"key":"e_1_3_2_2_25_1","volume-title":"Hogwild: A lock-free approach to parallelizing stochastic gradient descent. In Advances in neural information processing systems. 693--701.","author":"Recht Benjamin","year":"2011"},{"key":"e_1_3_2_2_26_1","unstructured":"Chad Scherrer Ambuj Tewari Mahantesh Halappanavar and David Haglin. 2012. Feature clustering for accelerating parallel coordinate descent. In Advances in Neural Information Processing Systems. 28--36.   Chad Scherrer Ambuj Tewari Mahantesh Halappanavar and David Haglin. 2012. Feature clustering for accelerating parallel coordinate descent. In Advances in Neural Information Processing Systems. 28--36."},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/2810103.2813687"},{"key":"e_1_3_2_2_28_1","volume-title":"29th Annual Conference on Neural Information Processing Systems (NIPS) .","author":"Takabi Hassan","year":"2016"},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/1281192.1281275"},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"publisher","DOI":"10.1016\/J.ENG.2016.02.008"},{"key":"e_1_3_2_2_31_1","unstructured":"Yi Zhou Yaoliang Yu Wei Dai Yingbin Liang and Eric Xing. 2016. On convergence of model parallel proximal gradient algorithm for stale synchronous parallel system. In Artificial Intelligence and Statistics . 713--722.  Yi Zhou Yaoliang Yu Wei Dai Yingbin Liang and Eric Xing. 2016. On convergence of model parallel proximal gradient algorithm for stale synchronous parallel system. In Artificial Intelligence and Statistics . 713--722."},{"key":"e_1_3_2_2_32_1","unstructured":"Martin Zinkevich Markus Weimer Lihong Li and Alex J Smola. 2010. Parallelized stochastic gradient descent. In Advances in neural information processing systems. 2595--2603.   Martin Zinkevich Markus Weimer Lihong Li and Alex J Smola. 2010. Parallelized stochastic gradient descent. In Advances in neural information processing systems. 2595--2603."}],"event":{"name":"KDD '19: The 25th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","location":"Anchorage AK USA","acronym":"KDD '19","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"]},"container-title":["Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery &amp; Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3292500.3330765","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3292500.3330765","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T00:57:51Z","timestamp":1750208271000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3292500.3330765"}},"subtitle":["A Collaborative Machine Learning Framework for Distributed Features"],"short-title":[],"issued":{"date-parts":[[2019,7,25]]},"references-count":31,"alternative-id":["10.1145\/3292500.3330765","10.1145\/3292500"],"URL":"https:\/\/doi.org\/10.1145\/3292500.3330765","relation":{},"subject":[],"published":{"date-parts":[[2019,7,25]]},"assertion":[{"value":"2019-07-25","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}