{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,5]],"date-time":"2026-05-05T04:16:49Z","timestamp":1777954609324,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":98,"publisher":"ACM","funder":[{"DOI":"10.13039\/501100006374","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CCF-2318633"],"award-info":[{"award-number":["CCF-2318633"]}],"id":[{"id":"10.13039\/501100006374","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,7,16]]},"DOI":"10.1145\/3694906.3743354","type":"proceedings-article","created":{"date-parts":[[2025,7,16]],"date-time":"2025-07-16T16:19:56Z","timestamp":1752682796000},"page":"17-33","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Applying Fast Fourier Transforms to Accelerate Spatially and Temporally Inhomogeneous Stencil Computations"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0008-1198-526X","authenticated-orcid":false,"given":"Russell","family":"Bentley","sequence":"first","affiliation":[{"name":"Stony Brook University"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7022-5278","authenticated-orcid":false,"given":"Rezaul","family":"Chowdhury","sequence":"additional","affiliation":[{"name":"Stony Brook University"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-2836-1727","authenticated-orcid":false,"given":"Aaron","family":"Gregory","sequence":"additional","affiliation":[{"name":"Stony Brook University"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-6792-8548","authenticated-orcid":false,"given":"Michael","family":"Santomauro","sequence":"additional","affiliation":[{"name":"Stony Brook University"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,7,16]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"PLuTo. An automatic parallelizer and locality optimizer for affine loop nests. http:\/\/pluto-compiler.sourceforge.net\/."},{"key":"e_1_3_2_1_2_1","unstructured":"Rayon. Rayon-1.10.0. https:\/\/github.com\/rayon-rs\/rayon."},{"key":"e_1_3_2_1_3_1","unstructured":"Rust. The Rust Programming Language. https:\/\/www.rust-lang.org\/."},{"key":"e_1_3_2_1_4_1","unstructured":"Stampede3. The Stampede3 supercomputing cluster. https:\/\/www.tacc.utexas.edu\/systems\/stampede3."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.sysconle.2010.03.002"},{"key":"e_1_3_2_1_6_1","volume-title":"Fast American option pricing using nonlinear stencils. arXiv preprint arXiv:2303.02317","author":"Ahmad Zafar","year":"2023","unstructured":"Zafar Ahmad, Reilly Browne, Rezaul Chowdhury, Rathish Das, Yushen Huang, and Yimin Zhu. 2023. Fast American option pricing using nonlinear stencils. arXiv preprint arXiv:2303.02317 (2023)."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/3627535.3638506"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/3409964.3461803"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/3490148.3538558"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/3606338"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611978759.21"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISPASS55109.2022.00010"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jcp.2016.11.033"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1002\/fld.3999"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1177\/1687814015591937"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1175\/1520-0493(1989)117<2113:APOHLS>2.0.CO;2"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/VG.2005.194111"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"crossref","unstructured":"Jiri Blazek. 2015. Computational Fluid Dynamics: Principles and Applications. Butterworth-Heinemann.","DOI":"10.1016\/B978-0-08-099995-1.00012-9"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"crossref","unstructured":"Timothy J Boerner Stephen Deems Thomas R Furlani Shelley L Knuth and John Towns. 2023. ACCESS: Advancing Innovation: NSF's Advanced Cyberinfrastructure Coordination Ecosystem: Services & Support. In Practice and Experience in Advanced Research Computing 2023: Computing for the Common Good. 173--176.","DOI":"10.1145\/3569951.3597559"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/1375581.1375595"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1137\/0804017"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/TASSP.1978.1163036"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1137\/0730089"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1137\/0721020"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1111\/j.1467-8659.2008.01210.x"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3627535.3638476"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2011.70"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1090\/S0025-5718-1965-0178586-1"},{"key":"e_1_3_2_1_29_1","volume-title":"Introduction to Algorithms","author":"Cormen Thomas H","unstructured":"Thomas H Cormen, Charles E Leiserson, Ronald L Rivest, and Clifford Stein. 2022. Introduction to Algorithms. MIT Press."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1017\/S0305004100023197"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1137\/S1064827592240555"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1137\/040615195"},{"key":"e_1_3_2_1_33_1","volume-title":"Computational Methods for Fluid Dynamics","author":"Ferziger Joel H","unstructured":"Joel H Ferziger, Milovan Peri\u0107, and Robert L Street. 2002. Computational Methods for Fluid Dynamics. Vol. 3. Springer."},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1063\/1.533339"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2004.840301"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/SFFCS.1999.814600"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/1088149.1088197"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1086\/374594"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jcp.2014.09.023"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.camwa.2012.12.006"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1006\/jcom.1994.1021"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/EMBC.2012.6346739"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1111\/j.2517-6161.1958.tb00300.x"},{"key":"e_1_3_2_1_44_1","volume-title":"Toeplitz and Circulant Matrices: A Review","author":"Gray Robert M","unstructured":"Robert M Gray. 2006. Toeplitz and Circulant Matrices: A Review. Now Publishers Inc."},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-46375-7_5"},{"key":"e_1_3_2_1_46_1","volume-title":"Numerical Computation of Internal and External Flows: The Fundamentals of Computational Fluid Dynamics","author":"Hirsch Charles","unstructured":"Charles Hirsch. 2007. Numerical Computation of Internal and External Flows: The Fundamentals of Computational Fluid Dynamics. Elsevier."},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1080\/00029890.1998.12004985"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1063\/1.3034415"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.matpr.2021.02.058"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00466-014-1071-8"},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1175\/1520-0477(1990)071<1410:GNWPAT>2.0.CO;2"},{"key":"e_1_3_2_1_52_1","volume-title":"Simulating a dual-array electrode configuration to investigate the influence of skeletal muscle fatigue following functional electrical stimulation. Computers in biology and medicine 42, 9","author":"Kim Juliana HK","year":"2012","unstructured":"Juliana HK Kim, Mark L Trew, Andrew J Pullan, and Oliver R\u00f6hrle. 2012. Simulating a dual-array electrode configuration to investigate the influence of skeletal muscle fatigue following functional electrical stimulation. Computers in biology and medicine 42, 9 (2012), 915--924."},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1137\/17M1133208"},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1007\/BF01060070"},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","DOI":"10.1046\/j.1365-8711.2002.05313.x"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1145\/2491956.2462187"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"crossref","unstructured":"Matthias Korch and Tim Werner. 2020. An in-depth introduction of multi-workgroup tiling for improving the locality of explicit one-step methods for ODE systems with limited access distance on GPUs. Concurrency and Computation: Practice and Experience (2020) e6016.","DOI":"10.1002\/cpe.6016"},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"publisher","DOI":"10.1137\/S0036144504445376"},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cam.2009.05.028"},{"key":"e_1_3_2_1_60_1","doi-asserted-by":"publisher","DOI":"10.1186\/s42492-018-0009-y"},{"key":"e_1_3_2_1_61_1","doi-asserted-by":"publisher","DOI":"10.5194\/gmd-12-1165-2019"},{"key":"e_1_3_2_1_62_1","doi-asserted-by":"publisher","DOI":"10.1137\/140984002"},{"key":"e_1_3_2_1_63_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cnsns.2014.08.021"},{"key":"e_1_3_2_1_64_1","doi-asserted-by":"publisher","DOI":"10.1006\/jcph.1997.5856"},{"key":"e_1_3_2_1_65_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jafrearsci.2018.10.016"},{"key":"e_1_3_2_1_66_1","doi-asserted-by":"publisher","DOI":"10.1002\/nla.542"},{"key":"e_1_3_2_1_67_1","doi-asserted-by":"publisher","DOI":"10.1109\/22.903100"},{"key":"e_1_3_2_1_68_1","doi-asserted-by":"publisher","DOI":"10.1109\/MCSE.2011.71"},{"key":"e_1_3_2_1_69_1","doi-asserted-by":"publisher","DOI":"10.2298\/SJEE1301165P"},{"key":"e_1_3_2_1_70_1","doi-asserted-by":"publisher","DOI":"10.1016\/0370-1573(89)90024-0"},{"key":"e_1_3_2_1_71_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-11821-0"},{"key":"e_1_3_2_1_72_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jsv.2015.09.033"},{"key":"e_1_3_2_1_73_1","doi-asserted-by":"publisher","DOI":"10.1080\/07055900.1981.9649098"},{"key":"e_1_3_2_1_74_1","doi-asserted-by":"crossref","DOI":"10.2151\/jmsj1965.60.1_319","article-title":"A semi-Lagrangian and semi-implicit numerical integration scheme for the primitive meteorological equations","author":"Robert Andre","year":"1982","unstructured":"Andre Robert. 1982. A semi-Lagrangian and semi-implicit numerical integration scheme for the primitive meteorological equations. Journal of the Meteorological Society of Japan. Ser. II 60, 1 (1982), 319--325.","journal-title":"Journal of the Meteorological Society of Japan. Ser."},{"key":"e_1_3_2_1_75_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.promfg.2015.09.012"},{"key":"e_1_3_2_1_76_1","doi-asserted-by":"publisher","DOI":"10.1063\/1.4823282"},{"key":"e_1_3_2_1_77_1","doi-asserted-by":"publisher","DOI":"10.5555\/3037518.3037519"},{"key":"e_1_3_2_1_78_1","doi-asserted-by":"publisher","DOI":"10.1016\/0021-9991(88)90102-7"},{"key":"e_1_3_2_1_79_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jocs.2016.05.007"},{"key":"e_1_3_2_1_80_1","doi-asserted-by":"publisher","DOI":"10.1007\/BF01082526"},{"key":"e_1_3_2_1_81_1","doi-asserted-by":"publisher","DOI":"10.1137\/0721062"},{"key":"e_1_3_2_1_82_1","doi-asserted-by":"publisher","DOI":"10.1115\/1.1849175"},{"key":"e_1_3_2_1_83_1","volume-title":"Computational Electrodynamics: The Finite-difference Time-domain Method","author":"Taflove Allen","year":"2005","unstructured":"Allen Taflove and Susan C Hagness. 2005. Computational Electrodynamics: The Finite-difference Time-domain Method. Artech House."},{"key":"e_1_3_2_1_84_1","doi-asserted-by":"publisher","DOI":"10.1145\/1989493.1989508"},{"key":"e_1_3_2_1_85_1","volume-title":"Poster. USENIX Workshop on Hot Topics in Parallelism.","author":"Tang Yuan","year":"2011","unstructured":"Yuan Tang, Rezaul Chowdhury, Chi-Keung Luk, and Charles E Leiserson. 2011. Coding stencil computations using the Pochoir stencil-specification language. In Poster. USENIX Workshop on Hot Topics in Parallelism."},{"key":"e_1_3_2_1_86_1","unstructured":"Jesmin Jahan Tithi. 2015. Engineering high-performance parallel algorithms with applications to bioinformatics. Ph.D. Dissertation. State University of New York at Stony Brook."},{"key":"e_1_3_2_1_87_1","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPSW.2013.241"},{"key":"e_1_3_2_1_88_1","doi-asserted-by":"publisher","DOI":"10.1016\/0024-3795(94)00025-5"},{"key":"e_1_3_2_1_89_1","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511615115"},{"key":"e_1_3_2_1_90_1","doi-asserted-by":"publisher","DOI":"10.1080\/01495728408961817"},{"key":"e_1_3_2_1_91_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-56802-2"},{"key":"e_1_3_2_1_92_1","doi-asserted-by":"publisher","DOI":"10.1137\/S0036142901396715"},{"key":"e_1_3_2_1_93_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-7091-6586-7_13"},{"key":"e_1_3_2_1_94_1","first-page":"33","article-title":"Applications of nonlinear diffusion in image processing and computer vision","volume":"70","author":"Weickert Joachim","year":"2001","unstructured":"Joachim Weickert. 2001. Applications of nonlinear diffusion in image processing and computer vision. Acta Math. Univ. Comenianae 70, 1 (2001), 33--50.","journal-title":"Acta Math. Univ. Comenianae"},{"key":"e_1_3_2_1_95_1","doi-asserted-by":"publisher","DOI":"10.1093\/imanum\/16.4.583"},{"key":"e_1_3_2_1_96_1","doi-asserted-by":"publisher","DOI":"10.1090\/S0025-5718-1978-0468306-4"},{"key":"e_1_3_2_1_97_1","doi-asserted-by":"publisher","DOI":"10.1137\/030602666"},{"key":"e_1_3_2_1_98_1","doi-asserted-by":"publisher","DOI":"10.3390\/coatings12091277"}],"event":{"name":"SPAA '25: 37th ACM Symposium on Parallelism in Algorithms and Architectures","location":"Portland OR USA","acronym":"SPAA '25","sponsor":["SIGACT ACM Special Interest Group on Algorithms and Computation Theory","SIGARCH ACM Special Interest Group on Computer Architecture","EATCS European Association for Theoretical Computer Science"]},"container-title":["Proceedings of the 37th ACM Symposium on Parallelism in Algorithms and Architectures"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3694906.3743354","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T19:19:57Z","timestamp":1777922397000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3694906.3743354"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,16]]},"references-count":98,"alternative-id":["10.1145\/3694906.3743354","10.1145\/3694906"],"URL":"https:\/\/doi.org\/10.1145\/3694906.3743354","relation":{},"subject":[],"published":{"date-parts":[[2025,7,16]]},"assertion":[{"value":"2025-07-16","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}