{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,4,2]],"date-time":"2025-04-02T05:40:06Z","timestamp":1743572406753,"version":"3.40.3"},"publisher-location":"Cham","reference-count":25,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031856990","type":"print"},{"value":"9783031857003","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-85700-3_14","type":"book-chapter","created":{"date-parts":[[2025,4,2]],"date-time":"2025-04-02T05:01:34Z","timestamp":1743570094000},"page":"193-206","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Boosting GPGPU Virtualization and\u00a0Multiplexing with\u00a0RDMA Communication"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-7883-4931","authenticated-orcid":false,"given":"Mariano","family":"Aponte","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9545-9978","authenticated-orcid":false,"given":"Gennaro","family":"Mellone","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3828-0170","authenticated-orcid":false,"given":"Ciro Giuseppe","family":"De Vita","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0810-2250","authenticated-orcid":false,"given":"Giuseppe","family":"Salvi","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6119-2099","authenticated-orcid":false,"given":"Nikhil B.","family":"Gaikwad","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9441-4508","authenticated-orcid":false,"given":"Sokol","family":"Kosta","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,4,1]]},"reference":[{"key":"14_CR1","doi-asserted-by":"crossref","unstructured":"Antunes, B.A., Hill, D.R.: Reproducibility, replicability, and repeatability: a survey of reproducible research with a focus on high performance computing. arXiv preprint arXiv:2402.07530 (2024)","DOI":"10.1016\/j.cosrev.2024.100655"},{"key":"14_CR2","doi-asserted-by":"crossref","unstructured":"Boccia, V., Carracciuolo, L., Laccetti, G., Lapegna, M., Mele, V.: Hadab: enabling fault tolerance in parallel applications running in distributed environments. In: Parallel Processing and Applied Mathematics: 9th International Conference, PPAM 2011, Torun, Poland, 11\u201314 September 2011. Revised Selected Papers, Part I 9, pp. 700\u2013709. Springer, Cham (2012)","DOI":"10.1007\/978-3-642-31464-3_71"},{"key":"14_CR3","doi-asserted-by":"crossref","unstructured":"Di\u00a0Lauro, R., Giannone, F., Ambrosio, L., Montella, R.: Virtualizing general purpose GPUs for high performance cloud computing: an application to a fluid simulator. In: 2012 IEEE 10th International Symposium on Parallel and Distributed Processing with Applications, pp. 863\u2013864. IEEE (2012)","DOI":"10.1109\/ISPA.2012.136"},{"key":"14_CR4","doi-asserted-by":"publisher","unstructured":"Frey, P.W., Alonso, G.: Minimizing the hidden cost of RDMA. In: 2009 29th IEEE International Conference on Distributed Computing Systems, pp. 553\u2013560 (2009). https:\/\/doi.org\/10.1109\/ICDCS.2009.32","DOI":"10.1109\/ICDCS.2009.32"},{"key":"14_CR5","doi-asserted-by":"publisher","unstructured":"Giunta, G., Montella, R., Agrillo, G., Coviello, G.: A GPGPU transparent virtualization component for high performance computing clouds. In: D\u2019Ambra, P., Guarracino, M., Talia, D. (eds.) Euro-Par 2010. LNCS, vol. 6271, pp. 379\u2013391. Springer, Heidelberg (2010). https:\/\/doi.org\/10.1007\/978-3-642-15277-1_37","DOI":"10.1007\/978-3-642-15277-1_37"},{"key":"14_CR6","doi-asserted-by":"crossref","unstructured":"Gupta, V., et al.: GVIM: GPU-accelerated virtual machines. In: Proceedings of the 3rd ACM Workshop on System-Level Virtualization for High Performance Computing. HPCVirt \u201909, pp. 17\u201324. Association for Computing Machinery, New York, NY, USA (2009)","DOI":"10.1145\/1519138.1519141"},{"key":"14_CR7","unstructured":"Kawai, A., Yasuoka, K., Yoshikawa, K., Narumi, T.: Distributed-shared CUDA: virtualization of large-scale GPU systems for programmability and reliability. In: FUTURE COMPUTING 2012, The Fourth International Conference on Future Computational Technologies and Applications, pp. 7\u201312 (2012)"},{"key":"14_CR8","doi-asserted-by":"crossref","unstructured":"Laccetti, G., Montella, R., Palmieri, C., Pelliccia, V.: The high performance internet of things: using GVIRTUS to share high-end GPUs with arm based cluster computing nodes. In: International Conference on Parallel Processing and Applied Mathematics, pp. 734\u2013744. Springer, Cham (2013)","DOI":"10.1007\/978-3-642-55224-3_69"},{"key":"14_CR9","doi-asserted-by":"crossref","unstructured":"Marcellino, L., et al.: Using GPGPU accelerated interpolation algorithms for marine bathymetry processing with on-premises and cloud based computational resources. In: International Conference on Parallel Processing and Applied Mathematics, pp. 14\u201324. Springer, Cham (2017)","DOI":"10.1007\/978-3-319-78054-2_2"},{"key":"14_CR10","doi-asserted-by":"crossref","unstructured":"Mentone, A., Di\u00a0Luccio, D., Landolfi, L., Kosta, S., Montella, R.: CUDA virtualization and remoting for GPGPU based acceleration offloading at the edge. In: International Conference on Internet and Distributed Computing Systems, pp. 414\u2013423. Springer, Cham (2019)","DOI":"10.1007\/978-3-030-34914-1_39"},{"key":"14_CR11","doi-asserted-by":"crossref","unstructured":"Montella, R., Coviello, G., Giunta, G., Laccetti, G., Isaila, F., Blas, J.G.: A general-purpose virtualization service for HPC on cloud computing: an application to GPUs. In: Parallel Processing and Applied Mathematics: 9th International Conference, PPAM 2011, Torun, Poland, 11\u201314 September 2011. Revised Selected Papers, Part I 9, pp. 740\u2013749. Springer, Heidelberg (2012)","DOI":"10.1007\/978-3-642-31464-3_75"},{"key":"14_CR12","doi-asserted-by":"crossref","unstructured":"Montella, R., et al.: Enabling the CUDA unified memory model in edge, cloud and HPC offloaded GPU kernels. In: 2022 22nd IEEE International Symposium on Cluster, Cloud and Internet Computing (CCGrid), pp. 834\u2013841. IEEE (2022)","DOI":"10.1109\/CCGrid54584.2022.00099"},{"key":"14_CR13","doi-asserted-by":"crossref","unstructured":"Montella, R., Ferraro, C., Kosta, S., Pelliccia, V., Giunta, G.: Enabling android-based devices to high-end GPGPUs. In: Algorithms and Architectures for Parallel Processing: 16th International Conference, ICA3PP 2016, Granada, Spain, 14\u201316 December 2016, Proceedings 15, pp. 118\u2013125. Springer, Cham (2016)","DOI":"10.1007\/978-3-319-49583-5_9"},{"key":"14_CR14","doi-asserted-by":"crossref","first-page":"139","DOI":"10.1007\/s10586-013-0341-0","volume":"17","author":"R Montella","year":"2014","unstructured":"Montella, R., Giunta, G., Laccetti, G.: Virtualizing high-end GPGPUs on arm clusters for the next generation of high performance cloud computing. Clust. Comput. 17, 139\u2013152 (2014)","journal-title":"Clust. Comput."},{"key":"14_CR15","unstructured":"Montella, R., et al.: Virtualizing CUDA enabled GPGPUs on arm clusters. In: Parallel Processing and Applied Mathematics: 11th International Conference, PPAM 2015, Krakow, Poland, 6\u20139 September 2015. Revised Selected Papers, Part II, pp. 3\u201314. Springer, Cham (2016)"},{"key":"14_CR16","doi-asserted-by":"crossref","first-page":"1142","DOI":"10.1007\/s10766-016-0462-1","volume":"45","author":"R Montella","year":"2017","unstructured":"Montella, R., et al.: On the virtualization of CUDA based GPU remoting on arm and x86 machines in the GVIRTUS framework. Int. J. Parallel Prog. 45, 1142\u20131163 (2017)","journal-title":"Int. J. Parallel Prog."},{"issue":"24","key":"14_CR17","doi-asserted-by":"crossref","DOI":"10.1002\/cpe.4286","volume":"29","author":"R Montella","year":"2017","unstructured":"Montella, R., et al.: Accelerating Linux and android applications on low-power devices through remote GPGPU offloading. Concurr. Compu. Pract. Exp. 29(24), e4286 (2017)","journal-title":"Concurr. Compu. Pract. Exp."},{"issue":"24","key":"14_CR18","doi-asserted-by":"crossref","DOI":"10.1002\/cpe.4895","volume":"30","author":"R Montella","year":"2018","unstructured":"Montella, R., et al.: Marine bathymetry processing through GPGPU virtualization in high performance cloud computing. Concurr. Compu. Pract. Exp. 30(24), e4895 (2018)","journal-title":"Concurr. Compu. Pract. Exp."},{"issue":"15","key":"14_CR19","doi-asserted-by":"crossref","first-page":"2053","DOI":"10.1002\/cpe.1548","volume":"22","author":"A Murli","year":"2010","unstructured":"Murli, A., D\u2019Amore, L., Laccetti, G., Gregoretti, F., Oliva, G.: A multi-grained distributed implementation of the parallel block conjugate gradient algorithm. Concurr. Compu. Pract. Exp. 22(15), 2053\u20132072 (2010)","journal-title":"Concurr. Compu. Pract. Exp."},{"key":"14_CR20","doi-asserted-by":"publisher","unstructured":"Pham, Q., Malik, T., Foster, I., Di Lauro, R., Montella, R.: SOLE: linking research papers with science objects. In: Groth, P., Frew, J. (eds.) IPAW 2012. LNCS, vol. 7525, pp. 203\u2013208. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-34222-6_16","DOI":"10.1007\/978-3-642-34222-6_16"},{"key":"14_CR21","doi-asserted-by":"crossref","unstructured":"Rea\u00f1o, C., et al.: Poster: boosting the performance of remote GPU virtualization using infiniband connect-IB and PCIE 3.0. In: 2014 IEEE International Conference on Cluster Computing (CLUSTER), pp. 266\u2013267 (2014)","DOI":"10.1109\/CLUSTER.2014.6968737"},{"key":"14_CR22","doi-asserted-by":"crossref","first-page":"695","DOI":"10.1016\/j.future.2020.06.027","volume":"112","author":"D Romano","year":"2020","unstructured":"Romano, D., Lapegna, M., Mele, V., Laccetti, G.: Designing a GPU-parallel algorithm for raw SAR data compression: a focus on parallel performance estimation. Futur. Gener. Comput. Syst. 112, 695\u2013708 (2020)","journal-title":"Futur. Gener. Comput. Syst."},{"key":"14_CR23","doi-asserted-by":"crossref","first-page":"187","DOI":"10.1016\/j.future.2021.03.017","volume":"122","author":"DD S\u00e1nchez-Gallegos","year":"2021","unstructured":"S\u00e1nchez-Gallegos, D.D., Di Luccio, D., Kosta, S., Gonzalez-Compean, J., Montella, R.: An efficient pattern-based approach for workflow supporting large-scale science: the dagonstar experience. Futur. Gener. Comput. Syst. 122, 187\u2013203 (2021)","journal-title":"Futur. Gener. Comput. Syst."},{"key":"14_CR24","doi-asserted-by":"crossref","unstructured":"Shi, L., Chen, H., Sun, J., Li, K.: vCUDA: GPU accelerated high performance computing in virtual machines. In: 2009 IEEE International Symposium on Parallel and Distributed Processing, pp. 1\u201311 (2009)","DOI":"10.1109\/IPDPS.2009.5161020"},{"key":"14_CR25","doi-asserted-by":"crossref","unstructured":"Silla, F., Iserte, S., Rea\u00f1o, C., Prades, J.: On the benefits of the remote GPU virtualization mechanism: The rCUDA case. Concurr. Comput. Pract. Exp. 29(13), e4072 (2017)","DOI":"10.1002\/cpe.4072"}],"container-title":["Lecture Notes in Computer Science","Parallel Processing and Applied Mathematics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-85700-3_14","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,2]],"date-time":"2025-04-02T05:02:03Z","timestamp":1743570123000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-85700-3_14"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031856990","9783031857003"],"references-count":25,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-85700-3_14","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"1 April 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"PPAM","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Parallel Processing and Applied Mathematics","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Ostrava","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Czech Republic","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"9 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"12 September 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ppam2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/ppam.edu.pl\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}