{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,10]],"date-time":"2026-01-10T07:35:40Z","timestamp":1768030540818,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":28,"publisher":"ACM","license":[{"start":{"date-parts":[[2017,11,12]],"date-time":"2017-11-12T00:00:00Z","timestamp":1510444800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2017,11,12]]},"DOI":"10.1145\/3126908.3126954","type":"proceedings-article","created":{"date-parts":[[2017,11,8]],"date-time":"2017-11-08T21:02:30Z","timestamp":1510174950000},"page":"1-11","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":36,"title":["Scalable reduction collectives with data partitioning-based multi-leader design"],"prefix":"10.1145","author":[{"given":"Mohammadreza","family":"Bayatpour","sequence":"first","affiliation":[{"name":"The Ohio State University"}]},{"given":"Sourav","family":"Chakraborty","sequence":"additional","affiliation":[{"name":"The Ohio State University"}]},{"given":"Hari","family":"Subramoni","sequence":"additional","affiliation":[{"name":"The Ohio State University"}]},{"given":"Xiaoyi","family":"Lu","sequence":"additional","affiliation":[{"name":"The Ohio State University"}]},{"given":"Dhabaleswar K. (DK)","family":"Panda","sequence":"additional","affiliation":[{"name":"The Ohio State University"}]}],"member":"320","published-online":{"date-parts":[[2017,11,12]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"Mantevo Applications. http:\/\/mantevo.org\/packages\/  Mantevo Applications. http:\/\/mantevo.org\/packages\/"},{"key":"e_1_3_2_1_2_1","unstructured":"2015. The High Performance Conjugate Gradients Benchmark. (2015). http:\/\/hpcg-benchmark.org\/  2015. The High Performance Conjugate Gradients Benchmark. (2015). http:\/\/hpcg-benchmark.org\/"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/215399.215427"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/2966884.2966912"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/HOTI.2015.22"},{"key":"e_1_3_2_1_6_1","volume-title":"Open Source High Performance Computing","author":"Open","year":"2017","unstructured":"Open MPI : Open Source High Performance Computing . 2017 . http:\/\/www.open-mpi.org. (2017). Open MPI: Open Source High Performance Computing. 2017. http:\/\/www.open-mpi.org. (2017)."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/155332.155333"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.5555\/3018058.3018059"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-8191(06)80021-9"},{"key":"e_1_3_2_1_10_1","unstructured":"IB 2017. InfiniBand Trade Association. http:\/\/www.infinibandta.com. (2017).  IB 2017. InfiniBand Trade Association. http:\/\/www.infinibandta.com. (2017)."},{"key":"e_1_3_2_1_11_1","unstructured":"J. Liu and W. Jiang and P. Wyckoff and D. K. Panda and D. Ashton and D. Buntinas and B. Gropp and B. Tooney. 2004. High Performance Implementation of MPICH2 over InfiniBand with RDMA Support. In IPDPS.  J. Liu and W. Jiang and P. Wyckoff and D. K. Panda and D. Ashton and D. Buntinas and B. Gropp and B. Tooney. 2004. High Performance Implementation of MPICH2 over InfiniBand with RDMA Support. In IPDPS."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00450-011-0170-4"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2012.106"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.5555\/645612.662667"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10586-014-0361-4"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/2493123.2462903"},{"key":"e_1_3_2_1_17_1","volume-title":"Proceedings of Int'l Parallel and Distributed Processing Symposium (IPDPS '04)","author":"Liu J.","unstructured":"J. Liu , W. Jiang , P. Wyckoff , D. K. Panda , D. Ashton , D. Buntinas , W. Gropp , and B. Toonen . 2004. Design and Implementation of MPICH2 over InfiniBand with RDMA Support . In Proceedings of Int'l Parallel and Distributed Processing Symposium (IPDPS '04) . J. Liu, W. Jiang, P. Wyckoff, D. K. Panda, D. Ashton, D. Buntinas, W. Gropp, and B. Toonen. 2004. Design and Implementation of MPICH2 over InfiniBand with RDMA Support. In Proceedings of Int'l Parallel and Distributed Processing Symposium (IPDPS '04)."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2011.221"},{"key":"e_1_3_2_1_19_1","unstructured":"Message Passing Interface Forum 1994. MPI: A Message-Passing Interface Standard. Message Passing Interface Forum.  Message Passing Interface Forum 1994. MPI: A Message-Passing Interface Standard. Message Passing Interface Forum."},{"key":"e_1_3_2_1_20_1","unstructured":"OSU Micro-Benchmarks. 2017. http:\/\/mvapich.cse.ohio-state.edu\/benchmarks. (2017).  OSU Micro-Benchmarks. 2017. http:\/\/mvapich.cse.ohio-state.edu\/benchmarks. (2017)."},{"key":"e_1_3_2_1_21_1","unstructured":"MPI3 2012. MPI-3 Standard Document. http:\/\/www.mpi-forum.org\/docs\/mpi-3.0\/mpi30-report.pdf. (2012).  MPI3 2012. MPI-3 Standard Document. http:\/\/www.mpi-forum.org\/docs\/mpi-3.0\/mpi30-report.pdf. (2012)."},{"key":"e_1_3_2_1_22_1","unstructured":"MVAPICH2 2017. MVAPICH: MPI over InfiniBand Omni-Path Ethernet\/iWARP and RoCE. http:\/\/mvapich.cse.ohio-state.edu\/. (2017).  MVAPICH2 2017. MVAPICH: MPI over InfiniBand Omni-Path Ethernet\/iWARP and RoCE. http:\/\/mvapich.cse.ohio-state.edu\/. (2017)."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2005.335"},{"key":"e_1_3_2_1_24_1","volume-title":"Proceedings of the message passing interface developerfis and userfis conference","volume":"1999","author":"Rabenseifner Rolf","year":"1999","unstructured":"Rolf Rabenseifner . 1999 . Automatic MPI Counter Profiling of all Users: First Results on a CRAY T3E 900-512 . In Proceedings of the message passing interface developerfis and userfis conference , Vol. 1999 . 77--85. Rolf Rabenseifner. 1999. Automatic MPI Counter Profiling of all Users: First Results on a CRAY T3E 900-512. In Proceedings of the message passing interface developerfis and userfis conference, Vol. 1999. 77--85."},{"key":"e_1_3_2_1_25_1","volume-title":"Optimization of Collective Reduction Operations. In International Conference on Computational Science. Springer, 1--9.","author":"Rabenseifner Rolf","year":"2004","unstructured":"Rolf Rabenseifner . 2004 . Optimization of Collective Reduction Operations. In International Conference on Computational Science. Springer, 1--9. Rolf Rabenseifner. 2004. Optimization of Collective Reduction Operations. In International Conference on Computational Science. Springer, 1--9."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1177\/1094342005051521"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/HiPC.2014.7116876"},{"key":"e_1_3_2_1_28_1","volume-title":"(DK) Panda","author":"Zhang Jie","year":"2014","unstructured":"Jie Zhang , Xiaoyi Lu , Jithin Jose , Rong Shi , and Dhabaleswar K . (DK) Panda . 2014 . Can Inter-VM Shmem Benefit MPI Applications on SR-IOV Based Virtualized Infiniband Clusters? Springer International Publishing , Cham, 342--353. Jie Zhang, Xiaoyi Lu, Jithin Jose, Rong Shi, and Dhabaleswar K. (DK) Panda. 2014. Can Inter-VM Shmem Benefit MPI Applications on SR-IOV Based Virtualized Infiniband Clusters? Springer International Publishing, Cham, 342--353."}],"event":{"name":"SC '17: The International Conference for High Performance Computing, Networking, Storage and Analysis","location":"Denver Colorado","acronym":"SC '17","sponsor":["SIGHPC ACM Special Interest Group on High Performance Computing, Special Interest Group on High Performance Computing","IEEE CS"]},"container-title":["Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3126908.3126954","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3126908.3126954","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T02:11:08Z","timestamp":1750212668000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3126908.3126954"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,11,12]]},"references-count":28,"alternative-id":["10.1145\/3126908.3126954","10.1145\/3126908"],"URL":"https:\/\/doi.org\/10.1145\/3126908.3126954","relation":{},"subject":[],"published":{"date-parts":[[2017,11,12]]},"assertion":[{"value":"2017-11-12","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}