{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,8]],"date-time":"2025-07-08T17:42:54Z","timestamp":1751996574651,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":26,"publisher":"ACM","license":[{"start":{"date-parts":[[2018,6,22]],"date-time":"2018-06-22T00:00:00Z","timestamp":1529625600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2018,6,22]]},"DOI":"10.1145\/3234664.3234681","type":"proceedings-article","created":{"date-parts":[[2018,10,23]],"date-time":"2018-10-23T12:17:05Z","timestamp":1540297025000},"page":"53-57","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":3,"title":["Performance Comparison of CUDA and OpenACC Based on Optimizations"],"prefix":"10.1145","author":[{"given":"Xuechao","family":"Li","sequence":"first","affiliation":[{"name":"Computer Science Department, Concordia University Chicago, River Forest IL, USA"}]},{"given":"Po-Chou","family":"Shih","sequence":"additional","affiliation":[{"name":"Institute of Industrial and Business Management, National Taipei University of Technology Taipei, Taiwan"}]}],"member":"320","published-online":{"date-parts":[[2018,6,22]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1111\/j.1467-8659.2007.01012.x"},{"key":"e_1_3_2_1_2_1","volume-title":"October","author":"NVIDIA Corporation","year":"2012","unstructured":"NVIDIA Corporation , NVIDIA CUDA C Programming Guide v5.0 , October 2012 . NVIDIA Corporation, NVIDIA CUDA C Programming Guide v5.0, October 2012."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICPP.2011.45"},{"key":"e_1_3_2_1_4_1","unstructured":"The OpenACC Application Programming Interface Version1.0 November 2011.  The OpenACC Application Programming Interface Version1.0 November 2011."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/CCGrid.2013.12"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/SC.Companion.2012.66"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/IISWC.2009.5306797"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/MCSoC.2013.31"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1063\/1.3464228"},{"key":"e_1_3_2_1_10_1","first-page":"51","volume-title":"Evaluating Performance Portability of OpenACC. The 27th International Workshop on Languages and Compilers for Parallel Computing (LCPC)","author":"Amit S.","year":"2014","unstructured":"Amit , S. Putt , S. Seyong , L. and Jeffrey , V . Evaluating Performance Portability of OpenACC. The 27th International Workshop on Languages and Compilers for Parallel Computing (LCPC) , pp. 51 -- 66 , Sept. 2014 Amit, S. Putt, S. Seyong, L. and Jeffrey, V. Evaluating Performance Portability of OpenACC. The 27th International Workshop on Languages and Compilers for Parallel Computing (LCPC), pp. 51--66, Sept. 2014"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/2600212.2600704"},{"key":"e_1_3_2_1_12_1","unstructured":"Kamran K. Neil D. and Firas H. A Performance Comparison of CUDA and OpenCL.  Kamran K. Neil D. and Firas H. A Performance Comparison of CUDA and OpenCL."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.5121\/ijcsea.2016.6501"},{"key":"e_1_3_2_1_14_1","first-page":"448","volume-title":"Long-Sheng Huang and Kuo-Hsuan Wu. Overview and Comparison of OpenCL and CUDA Technology for GPGPU. IEEE Asia Pacific Conference on Circuits and Systems (APCCAS).","author":"Po-Yu Chen","year":"2012","unstructured":"Po-Yu Chen ; Chun-Chieh Lan; Long-Sheng Huang and Kuo-Hsuan Wu. Overview and Comparison of OpenCL and CUDA Technology for GPGPU. IEEE Asia Pacific Conference on Circuits and Systems (APCCAS). pp. 448 -- 451 . Dec. 2012 Po-Yu Chen; Chun-Chieh Lan; Long-Sheng Huang and Kuo-Hsuan Wu. Overview and Comparison of OpenCL and CUDA Technology for GPGPU. IEEE Asia Pacific Conference on Circuits and Systems (APCCAS). pp. 448--451. Dec. 2012"},{"key":"e_1_3_2_1_15_1","first-page":"1","volume-title":"27th International Conference on Architecture of Computing Systems (ARCS).","author":"Christgau S.","year":"2014","unstructured":"Christgau , S. Spazier , J. Schnor , B. Hammitzsch , M. Babeyko , A. and Waechter , J . A comparison of CUDA and OpenACC: Accelerating the Tsunami Simulation EasyWave . 27th International Conference on Architecture of Computing Systems (ARCS). pp. 1 -- 5 . Feb. 2014 Christgau, S. Spazier, J. Schnor, B. Hammitzsch, M. Babeyko, A. and Waechter, J. A comparison of CUDA and OpenACC: Accelerating the Tsunami Simulation EasyWave. 27th International Conference on Architecture of Computing Systems (ARCS). pp. 1--5. Feb. 2014"},{"key":"e_1_3_2_1_16_1","unstructured":"Ruym\u00e1n Reyes Iv\u00e1n L\u00f3pez J Fumero Francisco de Sande. A comparative study of OpenACC implementation. 2012  Ruym\u00e1n Reyes Iv\u00e1n L\u00f3pez J Fumero Francisco de Sande. A comparative study of OpenACC implementation. 2012"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/IISWC.2010.5650274"},{"key":"e_1_3_2_1_18_1","unstructured":"CUDA Education. https:\/\/developer.nvidia.com\/cuda-education  CUDA Education. https:\/\/developer.nvidia.com\/cuda-education"},{"issue":"5","key":"e_1_3_2_1_19_1","volume":"13","author":"Li P-C","year":"2016","unstructured":"X. Li , P-C . Shih , X-Q . Li , C. Seals. A Case Study of Novice Programmers on Parallel Programming Models. Journal of Computers. Vol. 13 , No. 5 , May 2016 . X. Li, P-C. Shih, X-Q. Li, C. Seals. A Case Study of Novice Programmers on Parallel Programming Models. Journal of Computers. Vol.13, No.5, May 2016.","journal-title":"Journal of Computers."},{"key":"e_1_3_2_1_20_1","volume-title":"OpenACC kernels and parallel constructs","author":"Michael W.","year":"2012","unstructured":"Michael , W. OpenACC kernels and parallel constructs . Aug. 2012 Michael, W. OpenACC kernels and parallel constructs. Aug. 2012"},{"key":"e_1_3_2_1_21_1","unstructured":"The OpenACC Application Programming Interface. Version 2.0 Jun. 2013  The OpenACC Application Programming Interface. Version 2.0 Jun. 2013"},{"key":"e_1_3_2_1_22_1","unstructured":"NVIDIA Inc. Parallel Thread Execution ISA Version 4.2 Mar. 2015  NVIDIA Inc. Parallel Thread Execution ISA Version 4.2 Mar. 2015"},{"key":"e_1_3_2_1_23_1","unstructured":"Calvin M Jeffrey O. and Xuechao L. Autotuning OpenACC Work Distribution via Direct Search.To appear at Extreme Science and Engineering Discovery Enviroment (XSEDE15) Jul. 2015  Calvin M Jeffrey O. and Xuechao L. Autotuning OpenACC Work Distribution via Direct Search.To appear at Extreme Science and Engineering Discovery Enviroment (XSEDE15) Jul. 2015"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLC.2011.6017014"},{"key":"e_1_3_2_1_26_1","unstructured":"http:\/\/aqua.dwavesys.com  http:\/\/aqua.dwavesys.com"},{"key":"e_1_3_2_1_27_1","unstructured":"NVIDIA Inc. Profiler Users Guide. Version 4.0 Mar. 2015  NVIDIA Inc. Profiler Users Guide. Version 4.0 Mar. 2015"}],"event":{"name":"HPCCT 2018: 2018 2nd High Performance Computing and Cluster Technologies Conference","sponsor":["Shanghai Jiao Tong University Shanghai Jiao Tong University","Xi'an Jiaotong-Liverpool University Xi'an Jiaotong-Liverpool University","Chinese Academy of Sciences"],"location":"Beijing China","acronym":"HPCCT 2018"},"container-title":["Proceedings of the 2018 2nd High Performance Computing and Cluster Technologies Conference"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3234664.3234681","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3234664.3234681","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T00:57:48Z","timestamp":1750208268000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3234664.3234681"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,6,22]]},"references-count":26,"alternative-id":["10.1145\/3234664.3234681","10.1145\/3234664"],"URL":"https:\/\/doi.org\/10.1145\/3234664.3234681","relation":{},"subject":[],"published":{"date-parts":[[2018,6,22]]},"assertion":[{"value":"2018-06-22","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}