{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,10]],"date-time":"2026-01-10T07:38:03Z","timestamp":1768030683988,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":23,"publisher":"ACM","license":[{"start":{"date-parts":[[2018,6,20]],"date-time":"2018-06-20T00:00:00Z","timestamp":1529452800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CNS-1405695 , CCF- 1618303\/7960"],"award-info":[{"award-number":["CNS-1405695 , CCF- 1618303\/7960"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2018,6,20]]},"DOI":"10.1145\/3241793.3241800","type":"proceedings-article","created":{"date-parts":[[2018,10,2]],"date-time":"2018-10-02T12:09:29Z","timestamp":1538482169000},"page":"1-6","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":23,"title":["FPGA HPC using OpenCL"],"prefix":"10.1145","author":[{"given":"Ahmed","family":"Sanaullah","sequence":"first","affiliation":[{"name":"Department of Electrical and Computer Engineering; Boston University, Boston, MA"}]},{"given":"Martin C.","family":"Herbordt","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering; Boston University, Boston, MA"}]}],"member":"320","published-online":{"date-parts":[[2018,6,20]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/1862648.1862653"},{"key":"e_1_3_2_1_2_1","volume-title":"Real-Time Data Analysis for Medical Diagnosis Using FPGA-Accelerated Neural Networks,\" BMC Bioinformatics","author":"Sanaullah A.","year":"2018","unstructured":"A. Sanaullah , C. Yang , Y. Alexeev , K. Yoshii , and M. C. Herbordt , \" Real-Time Data Analysis for Medical Diagnosis Using FPGA-Accelerated Neural Networks,\" BMC Bioinformatics , 2018 . A. Sanaullah, C. Yang, Y. Alexeev, K. Yoshii, and M. C. Herbordt, \"Real-Time Data Analysis for Medical Diagnosis Using FPGA-Accelerated Neural Networks,\" BMC Bioinformatics, 2018."},{"key":"e_1_3_2_1_3_1","first-page":"192","author":"Sanaullah A.","year":"2016","unstructured":"A. Sanaullah , A. Khoshparvar , and M. C. Herbordt , \"FPGA-Accelerated Particle-Grid Mapping,\" in Field-Programmable Custom Computing Machines , 2016 , pp. 192 -- 195 . A. Sanaullah, A. Khoshparvar, and M. C. Herbordt, \"FPGA-Accelerated Particle-Grid Mapping,\" in Field-Programmable Custom Computing Machines, 2016, pp. 192--195.","journal-title":"\"FPGA-Accelerated Particle-Grid Mapping,\" in Field-Programmable Custom Computing Machines"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-30117-2_90"},{"key":"e_1_3_2_1_5_1","first-page":"341","volume-title":"IEEE Conf. on Field Programmable Logic and Applications","author":"Sukhwani B.","year":"2008","unstructured":"B. Sukhwani and M. Herbordt , \" Acceleration of a Production Rigid Molecule Docking Code,\" in Proc . IEEE Conf. on Field Programmable Logic and Applications , 2008 , pp. 341 -- 346 . B. Sukhwani and M. Herbordt, \"Acceleration of a Production Rigid Molecule Docking Code,\" in Proc. IEEE Conf. on Field Programmable Logic and Applications, 2008, pp. 341--346."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1049\/iet-cdt.2009.0013"},{"key":"e_1_3_2_1_7_1","volume-title":"An FPGA Implementation of the Smooth Particle Mesh Ewald Reciprocal Sum Compute Engine (RSCE)","author":"Lee S.","year":"2005","unstructured":"S. Lee , An FPGA Implementation of the Smooth Particle Mesh Ewald Reciprocal Sum Compute Engine (RSCE) . University of Toronto , 2005 . S. Lee, An FPGA Implementation of the Smooth Particle Mesh Ewald Reciprocal Sum Compute Engine (RSCE). University of Toronto, 2005."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCSI.2010.2078750"},{"key":"e_1_3_2_1_9_1","first-page":"1238","author":"Andrade J.","year":"2013","unstructured":"J. Andrade , V. M. M. da Silva , and G. F. P. Fernandes , \" From OpenCL to Gates: The FFT.\" in GlobalSIP , 2013 , pp. 1238 -- 1241 . J. Andrade, V. M. M. da Silva, and G. F. P. Fernandes, \"From OpenCL to Gates: The FFT.\" in GlobalSIP, 2013, pp. 1238--1241.","journal-title":"GlobalSIP"},{"key":"e_1_3_2_1_10_1","first-page":"68","volume-title":"Int. Symp. Field-Programmable Custom Computing Machines. IEEE","author":"Humphries B.","year":"2014","unstructured":"B. Humphries , H. Zhang , J. Sheng , R. Landaverde , and M. C. Herbordt , \" 3D FFTs on a Single FPGA,\" in Proc . Int. Symp. Field-Programmable Custom Computing Machines. IEEE , 2014 , pp. 68 -- 71 . B. Humphries, H. Zhang, J. Sheng, R. Landaverde, and M. C. Herbordt, \"3D FFTs on a Single FPGA,\" in Proc. Int. Symp. Field-Programmable Custom Computing Machines. IEEE, 2014, pp. 68--71."},{"key":"e_1_3_2_1_11_1","first-page":"1","volume-title":"2014 IEEE. IEEE","author":"Sheng J.","year":"2014","unstructured":"J. Sheng , B. Humphries , H. Zhang , and M. C. Herbordt , \" Design of 3D FFTs with FPGA clusters,\" in High Performance Extreme Computing Conference (HPEC) , 2014 IEEE. IEEE , 2014 , pp. 1 -- 6 . J. Sheng, B. Humphries, H. Zhang, and M. C. Herbordt, \"Design of 3D FFTs with FPGA clusters,\" in High Performance Extreme Computing Conference (HPEC), 2014 IEEE. IEEE, 2014, pp. 1--6."},{"key":"e_1_3_2_1_12_1","volume-title":"Highly Efficient and Reconfigurable Technologies","author":"Sheng J.","year":"2015","unstructured":"J. Sheng , C. Yang , and M. Herbordt , \" Towards Low-Latency Communication on FPGA Clusters with 3D FFT Case Study,\" Proc . Highly Efficient and Reconfigurable Technologies , 2015 . J. Sheng, C. Yang, and M. Herbordt, \"Towards Low-Latency Communication on FPGA Clusters with 3D FFT Case Study,\" Proc. Highly Efficient and Reconfigurable Technologies, 2015."},{"key":"e_1_3_2_1_13_1","first-page":"1","volume-title":"HPC on FPGA Clouds: 3D FFTs and Implications for Molecular Dynamics,\" in Proc Field Programmable Logic and Applications","author":"Sheng J.","year":"2017","unstructured":"J. Sheng , C. Yang , A. Sanaullah , M. Papamichael , A. Caulfield , and M. C. Herbordt , \" HPC on FPGA Clouds: 3D FFTs and Implications for Molecular Dynamics,\" in Proc Field Programmable Logic and Applications , 2017 , pp. 1 -- 4 . J. Sheng, C. Yang, A. Sanaullah, M. Papamichael, A. Caulfield, and M. C. Herbordt, \"HPC on FPGA Clouds: 3D FFTs and Implications for Molecular Dynamics,\" in Proc Field Programmable Logic and Applications, 2017, pp. 1--4."},{"key":"e_1_3_2_1_14_1","unstructured":"Intel \"Intel FPGA SDK for OpenCL \" https:\/\/www.altera.com\/products\/design-software\/embedded-software-developers\/opencl\/developer-zone.html accessed: 2017-01-16.  Intel \"Intel FPGA SDK for OpenCL \" https:\/\/www.altera.com\/products\/design-software\/embedded-software-developers\/opencl\/developer-zone.html accessed: 2017-01-16."},{"key":"e_1_3_2_1_15_1","first-page":"409","volume-title":"Conf. for High Performance Computing, Networking, Storage and Analysis, SC16","author":"Zohouri H. R.","year":"2016","unstructured":"H. R. Zohouri , N. Maruyamay , A. Smith , M. Matsuda , and S. Matsuoka , \" Evaluating and Optimizing OpenCL Kernels for High Performance Computing with FPGAs,\" in Int . Conf. for High Performance Computing, Networking, Storage and Analysis, SC16 , 2016 , pp. 409 -- 420 . H. R. Zohouri, N. Maruyamay, A. Smith, M. Matsuda, and S. Matsuoka, \"Evaluating and Optimizing OpenCL Kernels for High Performance Computing with FPGAs,\" in Int. Conf. for High Performance Computing, Networking, Storage and Analysis, SC16, 2016, pp. 409--420."},{"key":"e_1_3_2_1_16_1","first-page":"1","author":"Yang C.","year":"2017","unstructured":"C. Yang , J. Sheng , R. Patel , A. Sanaullah , V. Sachdeva , and M. C. Herbordt , \"OpenCL for HPC with FPGAs: Case Study in Molecular Electrostatics,\" in IEEE High Performance Extreme Computing Conference , 2017 , pp. 1 -- 8 . C. Yang, J. Sheng, R. Patel, A. Sanaullah, V. Sachdeva, and M. C. Herbordt, \"OpenCL for HPC with FPGAs: Case Study in Molecular Electrostatics,\" in IEEE High Performance Extreme Computing Conference, 2017, pp. 1--8.","journal-title":"\"OpenCL for HPC with FPGAs: Case Study in Molecular Electrostatics,\" in IEEE High Performance Extreme Computing Conference"},{"key":"e_1_3_2_1_17_1","first-page":"76","volume-title":"Int. Symp. Field-Programmable Custom Computing Machines. IEEE","author":"Abedalmuhdi A.","year":"2017","unstructured":"A. Abedalmuhdi , B. E. Wells , and K.-I. Nishikawa , \" Efficient Particle-Grid Space Interpolation of an FPGA-Accelerated Particle-in-Cell Plasma Simulation,\" in Proc . Int. Symp. Field-Programmable Custom Computing Machines. IEEE , 2017 , pp. 76 -- 79 . A. Abedalmuhdi, B. E. Wells, and K.-I. Nishikawa, \"Efficient Particle-Grid Space Interpolation of an FPGA-Accelerated Particle-in-Cell Plasma Simulation,\" in Proc. Int. Symp. Field-Programmable Custom Computing Machines. IEEE, 2017, pp. 76--79."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-56154-7_45"},{"key":"e_1_3_2_1_19_1","first-page":"89","volume-title":"FPGA Implementation of a Dense Optical Flow Algorithm using Altera OpenCL SDK,\" in International Conference on ICT Innovations","author":"Ulutas U.","year":"2017","unstructured":"U. Ulutas , M. Tosun , V. E. Levent , D. B\u00fcy\u00fckayd\u0131n , T. Akg\u00fcn , and H. F. Ugurdag , \" FPGA Implementation of a Dense Optical Flow Algorithm using Altera OpenCL SDK,\" in International Conference on ICT Innovations . Springer , 2017 , pp. 89 -- 101 . U. Ulutas, M. Tosun, V. E. Levent, D. B\u00fcy\u00fckayd\u0131n, T. Akg\u00fcn, and H. F. Ugurdag, \"FPGA Implementation of a Dense Optical Flow Algorithm using Altera OpenCL SDK,\" in International Conference on ICT Innovations. Springer, 2017, pp. 89--101."},{"key":"e_1_3_2_1_20_1","unstructured":"P. Eastman and V. Pande \"OpenMM: a Hardware-Independent Framework for Molecular Simulations.\"  P. Eastman and V. Pande \"OpenMM: a Hardware-Independent Framework for Molecular Simulations.\""},{"key":"e_1_3_2_1_22_1","unstructured":"Altera \"FFT IP Core User Guide \" www.altera.com\/documentation\/hco1419012539637.html accessed: 2010-08-29.  Altera \"FFT IP Core User Guide \" www.altera.com\/documentation\/hco1419012539637.html accessed: 2010-08-29."},{"key":"e_1_3_2_1_23_1","unstructured":"Intel \"Computing an FFT \" https:\/\/software.intel.com\/en-us\/mkl-developer-reference-c-computing-an-fft 2018.  Intel \"Computing an FFT \" https:\/\/software.intel.com\/en-us\/mkl-developer-reference-c-computing-an-fft 2018."},{"key":"e_1_3_2_1_24_1","unstructured":"NVIDIA \"CUFFT library \" http:\/\/docs.nvidia.com\/cuda\/cufft 2018.  NVIDIA \"CUFFT library \" http:\/\/docs.nvidia.com\/cuda\/cufft 2018."}],"event":{"name":"HEART 2018: The 9th International Symposium on Highly-Efficient Accelerators and Reconfigurable Technologies","location":"Toronto ON Canada","acronym":"HEART 2018"},"container-title":["Proceedings of the 9th International Symposium on Highly-Efficient Accelerators and Reconfigurable Technologies"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3241793.3241800","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3241793.3241800","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3241793.3241800","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T02:08:10Z","timestamp":1750212490000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3241793.3241800"}},"subtitle":["Case Study in 3D FFT"],"short-title":[],"issued":{"date-parts":[[2018,6,20]]},"references-count":23,"alternative-id":["10.1145\/3241793.3241800","10.1145\/3241793"],"URL":"https:\/\/doi.org\/10.1145\/3241793.3241800","relation":{},"subject":[],"published":{"date-parts":[[2018,6,20]]},"assertion":[{"value":"2018-06-20","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}