{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T23:30:02Z","timestamp":1777937402293,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":14,"publisher":"ACM","license":[{"start":{"date-parts":[[2016,6,1]],"date-time":"2016-06-01T00:00:00Z","timestamp":1464739200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2016,6]]},"DOI":"10.1145\/2931088.2931091","type":"proceedings-article","created":{"date-parts":[[2016,5,25]],"date-time":"2016-05-25T20:14:10Z","timestamp":1464207250000},"page":"1-8","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":39,"title":["GPUrdma"],"prefix":"10.1145","author":[{"given":"Feras","family":"Daoud","sequence":"first","affiliation":[{"name":"Technion - Israel Institute of Technology"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Amir","family":"Watad","sequence":"additional","affiliation":[{"name":"Technion - Israel Institute of Technology"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mark","family":"Silberstein","sequence":"additional","affiliation":[{"name":"Technion - Israel Institute of Technology"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2016,6]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"GPI-2. http:\/\/www.gpi-site.com\/gpi2\/.  GPI-2. http:\/\/www.gpi-site.com\/gpi2\/."},{"key":"e_1_3_2_1_2_1","unstructured":"GPUDirectRDMA technology. http:\/\/docs.nvidia.com\/cuda\/gpudirect-rdma\/index.html.  GPUDirectRDMA technology. http:\/\/docs.nvidia.com\/cuda\/gpudirect-rdma\/index.html."},{"key":"e_1_3_2_1_3_1","unstructured":"MVAPICH2: High performance MPI over InfiniBand iWARP and RoCE. http:\/\/mvapich.cse.ohio-state.edu.  MVAPICH2: High performance MPI over InfiniBand iWARP and RoCE. http:\/\/mvapich.cse.ohio-state.edu."},{"key":"e_1_3_2_1_4_1","unstructured":"OpenFabrics Enterprise Distribution. https:\/\/www.openfabrics.org\/index.php\/openfabrics-software.html.  OpenFabrics Enterprise Distribution. https:\/\/www.openfabrics.org\/index.php\/openfabrics-software.html."},{"key":"e_1_3_2_1_5_1","first-page":"201","volume-title":"11th USENIX Symposium on Operating Systems Design and Implementation (OSDI 14)","author":"Kim Sangman","year":"2014"},{"key":"e_1_3_2_1_6_1","volume-title":"Newnes","author":"Kirk David B","year":"2012"},{"key":"e_1_3_2_1_7_1","volume-title":"International Journal of High Performance Computing Applications, page 8","author":"Oden Lena","year":"2015"},{"key":"e_1_3_2_1_8_1","first-page":"693","volume-title":"Advances in Neural Information Processing Systems","author":"Recht Benjamin","year":"2011"},{"key":"e_1_3_2_1_9_1","unstructured":"Davide Rossetti. GPUDirect async: integrating the GPU with a network interface.  Davide Rossetti. GPUDirect async: integrating the GPU with a network interface."},{"key":"e_1_3_2_1_10_1","volume-title":"Mark Silberstein. ActivePointers: A Case For Software Translation on GPUs. In Proceedings of the ACM IEEE International Symposium on Computer Architecture (ISCA). IEEE","author":"Shahar Sagi","year":"2016"},{"key":"e_1_3_2_1_11_1","volume-title":"GPUfs. In ACM International Conference on Systems and Storage (SYSTOR). ACM","author":"Shahar Sagi","year":"2016"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/2451116.2451169"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/2553081"},{"key":"e_1_3_2_1_14_1","unstructured":"https:\/\/github.com\/NVIDIA\/nccl. NCCL: optimized primitives for collective multi-GPU communication.  https:\/\/github.com\/NVIDIA\/nccl. NCCL: optimized primitives for collective multi-GPU communication."}],"event":{"name":"ROSS '16: International Workshop on Runtime and Operating Systems for Supercomputers","location":"Kyoto Japan","acronym":"ROSS '16","sponsor":["SIGHPC ACM Special Interest Group on High Performance Computing, Special Interest Group on High Performance Computing"]},"container-title":["Proceedings of the 6th International Workshop on Runtime and Operating Systems for Supercomputers"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2931088.2931091","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2931088.2931091","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:55:56Z","timestamp":1750222556000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2931088.2931091"}},"subtitle":["GPU-side library for high performance networking from GPU kernels"],"short-title":[],"issued":{"date-parts":[[2016,6]]},"references-count":14,"alternative-id":["10.1145\/2931088.2931091","10.1145\/2931088"],"URL":"https:\/\/doi.org\/10.1145\/2931088.2931091","relation":{},"subject":[],"published":{"date-parts":[[2016,6]]},"assertion":[{"value":"2016-06-01","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}