{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,18]],"date-time":"2026-03-18T09:19:15Z","timestamp":1773825555501,"version":"3.50.1"},"reference-count":34,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2020,1,8]],"date-time":"2020-01-08T00:00:00Z","timestamp":1578441600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,1,8]],"date-time":"2020-01-08T00:00:00Z","timestamp":1578441600000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001459","name":"Ministry of Education - Singapore","doi-asserted-by":"publisher","award":["MOE2017-T2-1-122"],"award-info":[{"award-number":["MOE2017-T2-1-122"]}],"id":[{"id":"10.13039\/501100001459","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Distrib Parallel Databases"],"published-print":{"date-parts":[[2020,12]]},"DOI":"10.1007\/s10619-019-07280-z","type":"journal-article","created":{"date-parts":[[2020,1,8]],"date-time":"2020-01-08T09:02:42Z","timestamp":1578474162000},"page":"771-793","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["Revisiting hash join on graphics processors: a decade later"],"prefix":"10.1007","volume":"38","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3473-2264","authenticated-orcid":false,"given":"Johns","family":"Paul","sequence":"first","affiliation":[]},{"given":"Bingsheng","family":"He","sequence":"additional","affiliation":[]},{"given":"Shengliang","family":"Lu","sequence":"additional","affiliation":[]},{"given":"Chiew Tong","family":"Lau","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,1,8]]},"reference":[{"key":"7280_CR1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-32518-2_3","volume-title":"Towards Optimization of Hybrid CPU\/GPU Query Plans in Database Systems","author":"S Bre\u00df","year":"2013","unstructured":"Bre\u00df, S., Schallehn, E., Geist, I.: Towards Optimization of Hybrid CPU\/GPU Query Plans in Database Systems. Springer, Berlin (2013)"},{"key":"7280_CR2","doi-asserted-by":"crossref","unstructured":"Rauhe, H., Dees, J., Sattler, K.-U., Faerber, F.: Multi-level parallel query execution framework for CPU and GPU. In: Proceedings of the East European Conference on Advances in Databases and Information Systems, pp. 330\u2013343 . Springer, New York (2013)","DOI":"10.1007\/978-3-642-40683-6_25"},{"key":"7280_CR3","doi-asserted-by":"crossref","unstructured":"Wu, H., Diamos, G., Sheard, T., Aref, M., Baxter, S., Garland, M., Yalamanchili, S.: Red fox: an execution environment for relational query processing on gpus. In: Proceedings of Annual IEEE\/ACM International Symposium on Code Generation and Optimization, ACM. p.\u00a044 (2014)","DOI":"10.1145\/2544137.2544166"},{"issue":"11","key":"7280_CR4","doi-asserted-by":"publisher","first-page":"1011","DOI":"10.14778\/2732967.2732976","volume":"7","author":"K Wang","year":"2014","unstructured":"Wang, K., Zhang, K., Yuan, Y., Ma, S., Lee, R., Ding, X., Zhang, X.: Concurrent analytical query processing with gpus. Proc. VLDB Endow. 7(11), 1011\u20131022 (2014)","journal-title":"Proc. VLDB Endow."},{"key":"7280_CR5","doi-asserted-by":"crossref","unstructured":"Pirk, H., Manegold, S., Kersten, M.: Waste not... efficient co-processing of relational data. In: 2014 IEEE 30th International Conference on Data Engineering, pp. 508\u2013519. IEEE (2014)","DOI":"10.1109\/ICDE.2014.6816677"},{"key":"7280_CR6","doi-asserted-by":"crossref","unstructured":"He, B., Yang, K., Fang, R., Lu, M., Govindaraju, N., Luo, Q., Sander, P.: Relational joins on graphics processors. In: Proceedings of the 2008 ACM SIGMOD International Conference on Management of Data, pp. 511\u2013524. ACM (2008)","DOI":"10.1145\/1376616.1376670"},{"issue":"10","key":"7280_CR7","doi-asserted-by":"publisher","first-page":"889","DOI":"10.14778\/2536206.2536216","volume":"6","author":"J He","year":"2013","unstructured":"He, J., Lu, M., He, B.: Revisiting co-processing for hash joins on the coupled cpu-gpu architecture. Proc. VLDB Endow. 6(10), 889\u2013900 (2013)","journal-title":"Proc. VLDB Endow."},{"key":"7280_CR8","doi-asserted-by":"crossref","unstructured":"Rui, R., Li, H., Tu, Y.-C.: Join algorithms on gpus: A revisit after seven years. In: 2015 IEEE International Conference on Big Data (Big Data), pp. 2541\u20132550. IEEE (2015)","DOI":"10.1109\/BigData.2015.7364051"},{"key":"7280_CR9","doi-asserted-by":"crossref","unstructured":"Rui, R., Tu, Y.-C.: Fast equi-join algorithms on gpus: Design and implementation. In: Proceedings of the 29th International Conference on Scientific and Statistical Database Management, p.\u00a017. ACM (2017)","DOI":"10.1145\/3085504.3085521"},{"issue":"9","key":"7280_CR10","doi-asserted-by":"publisher","first-page":"2663","DOI":"10.1109\/TPDS.2017.2677451","volume":"28","author":"M Yabuta","year":"2017","unstructured":"Yabuta, M., Nguyen, A., Kato, S., Edahiro, M., Kawashima, H.: Relational joins on gpus: a closer look. IEEE Trans. Parallel Distrib. Syst. 28(9), 2663\u20132673 (2017)","journal-title":"IEEE Trans. Parallel Distrib. Syst."},{"key":"7280_CR11","doi-asserted-by":"crossref","unstructured":"Kaldewey, T., Lohman, G., Mueller, R., Volk, P.: Gpu join processing revisited. In: Proceedings of the Eighth International Workshop on Data Management on New Hardware, pp. 55\u201362. ACM (2012)","DOI":"10.1145\/2236584.2236592"},{"key":"7280_CR12","doi-asserted-by":"crossref","unstructured":"Wu, H., Diamos, G., Cadambi, S., Yalamanchili, S.: Kernel weaver: Automatically fusing database primitives for efficient gpu computation. In: 2012 45th Annual IEEE\/ACM International Symposium on Microarchitecture, pp. 107\u2013118. IEEE (2012)","DOI":"10.1109\/MICRO.2012.19"},{"issue":"4","key":"7280_CR13","doi-asserted-by":"publisher","first-page":"329","DOI":"10.14778\/2735496.2735497","volume":"8","author":"J He","year":"2014","unstructured":"He, J., Zhang, S., He, B.: In-cache query co-processing on coupled cpu-gpu architectures. Proc. VLDB Endow. 8(4), 329\u2013340 (2014)","journal-title":"Proc. VLDB Endow."},{"key":"7280_CR14","doi-asserted-by":"crossref","unstructured":"Sioulas, P., Chrysogelos, P., Karpathiotakis, M., Appuswamy, R., Ailamaki, A.: Hardware-conscious hash-joins on gpus. In: 2019 IEEE 35th International Conference on Data Engineering (ICDE), pp. 698\u2013709. IEEE (2019)","DOI":"10.1109\/ICDE.2019.00068"},{"key":"7280_CR15","unstructured":"Diamos, G.F., Wu, H., Lele, A., Wang, J.: Efficient relational algebra algorithms and data structures for gpu. Georgia Institute of Technology, Tech. Rep. (2012)"},{"key":"7280_CR16","doi-asserted-by":"crossref","unstructured":"Paul, J., He, B., Lu, S., Lau, C.T.: Revisiting hash join on graphics processors: a decade later. In: 2019 IEEE 35th International Conference on Data Engineering Workshops (ICDEW), pp. 294\u2013299. IEEE (2019)","DOI":"10.1109\/ICDEW.2019.00008"},{"key":"7280_CR17","doi-asserted-by":"crossref","unstructured":"Blanas, S., Li, Y., Patel, J.M.: Design and evaluation of main memory hash join algorithms for multi-core cpus. In: Proceedings of the 2011 ACM SIGMOD International Conference on Management of data, pp. 37\u201348. ACM (2011)","DOI":"10.1145\/1989323.1989328"},{"key":"7280_CR18","doi-asserted-by":"crossref","unstructured":"Balkesen, C., Teubner, J., Alonso, G., \u00d6zsu, M.T.: Main-memory hash joins on multi-core cpus: Tuning to the underlying hardware. In: 2013 IEEE 29th International Conference on Data Engineering (ICDE), pp. 362\u2013373. IEEE (2013)","DOI":"10.1109\/ICDE.2013.6544839"},{"issue":"2","key":"7280_CR19","doi-asserted-by":"publisher","first-page":"1378","DOI":"10.14778\/1687553.1687564","volume":"2","author":"C Kim","year":"2009","unstructured":"Kim, C., Kaldewey, T., Lee, V.W., Sedlar, E., Nguyen, A.D., Satish, N., Chhugani, J., Di Blas, A., Dubey, P.: Sort vs. hash revisited: fast join implementation on modern multi-core cpus. Proc. VLDB Endow. 2(2), 1378\u20131389 (2009)","journal-title":"Proc. VLDB Endow."},{"key":"7280_CR20","first-page":"54","volume":"99","author":"PA Boncz","year":"1999","unstructured":"Boncz, P.A., Manegold, S., Kersten, M.L., et al.: Database architecture optimized for the new bottleneck: memory access. VLDB 99, 54\u201365 (1999)","journal-title":"VLDB"},{"issue":"2","key":"7280_CR21","doi-asserted-by":"publisher","first-page":"8","DOI":"10.1145\/1366102.1366105","volume":"33","author":"B He","year":"2008","unstructured":"He, B., Luo, Q.: Cache-oblivious databases: limitations and opportunities. ACM Trans. Database Syst. 33(2), 8 (2008)","journal-title":"ACM Trans. Database Syst."},{"issue":"3","key":"7280_CR22","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1145\/1272743.1272747","volume":"32","author":"S Chen","year":"2007","unstructured":"Chen, S., Ailamaki, A., Gibbons, P.B., Mowry, T.C.: Improving hash join performance through prefetching. ACM Trans. Database Syst. 32(3), 17 (2007)","journal-title":"ACM Trans. Database Syst."},{"issue":"1","key":"7280_CR23","doi-asserted-by":"publisher","first-page":"85","DOI":"10.14778\/2732219.2732227","volume":"7","author":"C Balkesen","year":"2013","unstructured":"Balkesen, C., Alonso, G., Teubner, J., \u00d6zsu, M.T.: Multi-core, main-memory joins: sort vs. hash revisited. Proc. VLDB Endow. 7(1), 85\u201396 (2013)","journal-title":"Proc. VLDB Endow."},{"issue":"1","key":"7280_CR24","doi-asserted-by":"publisher","first-page":"277","DOI":"10.14778\/1687627.1687659","volume":"2","author":"G Candea","year":"2009","unstructured":"Candea, G., Polyzotis, N., Vingralek, R.: A scalable, predictable join operator for highly concurrent data warehouses. Proc. VLDB Endow. 2(1), 277\u2013288 (2009)","journal-title":"Proc. VLDB Endow."},{"issue":"6","key":"7280_CR25","doi-asserted-by":"publisher","first-page":"480","DOI":"10.14778\/2904121.2904124","volume":"9","author":"D Makreshanski","year":"2016","unstructured":"Makreshanski, D., Giannikis, G., Alonso, G., Kossmann, D.: Mqjoin: efficient shared execution of main-memory joins. Proc. VLDB Endow. 9(6), 480\u2013491 (2016)","journal-title":"Proc. VLDB Endow."},{"issue":"6","key":"7280_CR26","doi-asserted-by":"publisher","first-page":"526","DOI":"10.14778\/2168651.2168654","volume":"5","author":"G Giannikis","year":"2012","unstructured":"Giannikis, G., Alonso, G., Kossmann, D.: Shareddb: killing one thousand queries with one stone. Proc. VLDB Endow. 5(6), 526\u2013537 (2012)","journal-title":"Proc. VLDB Endow."},{"key":"7280_CR27","doi-asserted-by":"crossref","unstructured":"Schuh, S., Chen, X., Dittrich, J.: An experimental comparison of thirteen relational equi-joins in main memory. In: Proceedings of the 2016 International Conference on Management of Data, pp. 1961\u20131976. ACM (2016)","DOI":"10.1145\/2882903.2882917"},{"key":"7280_CR28","doi-asserted-by":"crossref","unstructured":"Arumugam, S., Dobra, A., Jermaine, C.M., Pansare, N., Perez, L.: The datapath system: a data-centric analytic processing engine for large data warehouses. In: Proceedings of the 2010 ACM SIGMOD International Conference on Management of data, pp. 519\u2013530. ACM (2010)","DOI":"10.1145\/1807167.1807224"},{"key":"7280_CR29","doi-asserted-by":"crossref","unstructured":"Harizopoulos, S., Shkapenyuk, V., Ailamaki, A.: Qpipe: a simultaneously pipelined relational query engine. In: Proceedings of the 2005 ACM SIGMOD International Conference on Management of Data, pp. 383\u2013394. ACM (2005)","DOI":"10.1145\/1066157.1066201"},{"key":"7280_CR30","doi-asserted-by":"crossref","unstructured":"Alcantara, D.A., Volkov, V., Sengupta, S., Mitzenmacher, M., Owens, J.D., Amenta, N.: Building an efficient hash table on the gpu. In: GPU Computing Gems Jade Edition. Elsevier, pp. 39\u201353 (2012)","DOI":"10.1016\/B978-0-12-385963-1.00004-6"},{"key":"7280_CR31","unstructured":"Pirk, H., Manegold, S., Kersten, M.: Accelerating foreign-key joins using asymmetric memory channels. In: ADMS (2011)"},{"key":"7280_CR32","doi-asserted-by":"crossref","unstructured":"Gregg, C., Hazelwood, K.: Where is the data? why you cannot debate cpu vs. gpu performance without the answer. In: (IEEE ISPASS) IEEE International Symposium on Performance Analysis of Systems and Software, pp. 134\u2013144. IEEE (2011)","DOI":"10.1109\/ISPASS.2011.5762730"},{"issue":"10","key":"7280_CR33","doi-asserted-by":"publisher","first-page":"817","DOI":"10.14778\/2536206.2536210","volume":"6","author":"Y Yuan","year":"2013","unstructured":"Yuan, Y., Lee, R., Zhang, X.: The yin and yang of processing data warehousing queries on gpu devices. Proc. VLDB Endow. 6(10), 817\u2013828 (2013)","journal-title":"Proc. VLDB Endow."},{"issue":"9","key":"7280_CR34","doi-asserted-by":"publisher","first-page":"709","DOI":"10.14778\/2536360.2536370","volume":"6","author":"M Heimel","year":"2013","unstructured":"Heimel, M., Saecker, M., Pirk, H., Manegold, S., Markl, V.: Hardware-oblivious parallelism for in-memory column-stores. Proc. VLDB Endow. 6(9), 709\u2013720 (2013)","journal-title":"Proc. VLDB Endow."}],"container-title":["Distributed and Parallel Databases"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10619-019-07280-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10619-019-07280-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10619-019-07280-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,1,7]],"date-time":"2021-01-07T00:56:39Z","timestamp":1609980999000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10619-019-07280-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,1,8]]},"references-count":34,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2020,12]]}},"alternative-id":["7280"],"URL":"https:\/\/doi.org\/10.1007\/s10619-019-07280-z","relation":{},"ISSN":["0926-8782","1573-7578"],"issn-type":[{"value":"0926-8782","type":"print"},{"value":"1573-7578","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,1,8]]},"assertion":[{"value":"8 January 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}