{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T21:53:03Z","timestamp":1775166783684,"version":"3.50.1"},"reference-count":103,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2018,4,27]],"date-time":"2018-04-27T00:00:00Z","timestamp":1524787200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100003141","name":"Consejo Nacional de Ciencia y Tecnolog\u00eda","doi-asserted-by":"publisher","award":["342814"],"award-info":[{"award-number":["342814"]}],"id":[{"id":"10.13039\/501100003141","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Google (US) and Tides Foundation","award":["TFR15-00145"],"award-info":[{"award-number":["TFR15-00145"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Supercomput"],"published-print":{"date-parts":[[2018,7]]},"DOI":"10.1007\/s11227-018-2392-8","type":"journal-article","created":{"date-parts":[[2018,4,27]],"date-time":"2018-04-27T00:40:40Z","timestamp":1524789640000},"page":"3441-3467","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":20,"title":["Physically based visual simulation of the Lattice Boltzmann method on the GPU: a survey"],"prefix":"10.1007","volume":"74","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6801-8317","authenticated-orcid":false,"given":"Octavio","family":"Navarro-Hinojosa","sequence":"first","affiliation":[]},{"given":"Sergio","family":"Ruiz-Loza","sequence":"additional","affiliation":[]},{"given":"Mois\u00e9s","family":"Alencastre-Miranda","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,4,27]]},"reference":[{"key":"2392_CR1","doi-asserted-by":"publisher","DOI":"10.1016\/B978-044451612-1\/50007-X","volume-title":"Parallel algorithms of direct solving the Boltzmann equation in aerodynamics problems","author":"VV Aristov","year":"2004","unstructured":"Aristov VV, Frolova AA, Zabelok SA (2004) Parallel algorithms of direct solving the Boltzmann equation in aerodynamics problems. Elsevier, Amsterdam"},{"issue":"59","key":"2392_CR2","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1007\/BF03322610","volume":"56","author":"M Astorino","year":"2012","unstructured":"Astorino M, Becerra Sagredo J, Quarteroni A (2012) A modular lattice Boltzmann solver for GPU computing processors. SeMA J 56(59):53\u201378","journal-title":"SeMA J"},{"key":"2392_CR3","doi-asserted-by":"crossref","unstructured":"Audigier C, Mansi T, Delingette H, Rapaka S, Mihalef V, Sharma P, Carnegie D, Boctor E, Choti M, Kamen A et al (2013) Lattice Boltzmann method for fast patient-specific simulation of liver tumor ablation from CT images. In: International Conference on Medical Image Computing and Computer-Assisted Intervention. Springer, Berlin, pp 323\u2013330","DOI":"10.1007\/978-3-642-40760-4_41"},{"key":"2392_CR4","doi-asserted-by":"crossref","unstructured":"Bailey P, Myre J, Walsh SD, Lilja DJ, Saar MO (2009) Accelerating lattice Boltzmann fluid flow simulations using graphics processors. In: Parallel Processing, 2009. ICPP\u201909. International Conference on. IEEE, pp 550\u2013557","DOI":"10.1109\/ICPP.2009.38"},{"issue":"1","key":"2392_CR5","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1002\/cpe.1466","volume":"22","author":"M Bernaschi","year":"2010","unstructured":"Bernaschi M, Fatica M, Melchionna S, Succi S, Kaxiras E (2010) A flexible high-performance lattice Boltzmann GPU code for the simulations of fluid flows in complex geometries. Concurr Comput Pract Exp 22(1):1\u201314","journal-title":"Concurr Comput Pract Exp"},{"issue":"6","key":"2392_CR6","doi-asserted-by":"publisher","first-page":"066,707","DOI":"10.1103\/PhysRevE.80.066707","volume":"80","author":"M Bernaschi","year":"2009","unstructured":"Bernaschi M, Rossi L, Benzi R, Sbragaglia M, Succi S (2009) Graphics processing unit implementation of lattice Boltzmann models for flowing soft systems. Phys Rev E 80(6):066,707","journal-title":"Phys Rev E"},{"key":"2392_CR7","doi-asserted-by":"crossref","unstructured":"Bertazzo A, Mantovani F, Pivanti M, Pozzati F, Schifano SF, Tripiccione R (2012) Implementation and optimization of a thermal lattice Boltzmann algorithm on a multi-GPU cluster. In: 2012 innovative parallel computing, InPar 2012","DOI":"10.1109\/InPar.2012.6339603"},{"issue":"1","key":"2392_CR8","doi-asserted-by":"publisher","first-page":"55","DOI":"10.1016\/j.compfluid.2012.06.003","volume":"80","author":"L Biferale","year":"2013","unstructured":"Biferale L, Mantovani F, Pivanti M, Pozzati F, Sbragaglia M, Scagliarini A, Schifano SF, Toschi F, Tripiccione R (2013) An optimized D2Q37 lattice Boltzmann code on GP-GPUs. Comput Fluids 80(1):55\u201362. \n                    https:\/\/doi.org\/10.1016\/j.compfluid.2012.06.003","journal-title":"Comput Fluids"},{"issue":"01","key":"2392_CR9","doi-asserted-by":"publisher","first-page":"48","DOI":"10.4208\/cicp.210910.250311a","volume":"11","author":"M Bisson","year":"2012","unstructured":"Bisson M, Bernaschi M, Melchionna S, Succi S, Kaxiras E (2012) Multiscale hemodynamics using GPU clusters. Commun Comput Phys 11(01):48\u201364","journal-title":"Commun Comput Phys"},{"key":"2392_CR10","doi-asserted-by":"crossref","unstructured":"Blair S, Albing C, Grund A, Jocksch A (2015) Accelerating an MPI lattice Boltzmann code using OpenACC. In: Proceedings of the second workshop on accelerator programming using directives. ACM, p\u00a03","DOI":"10.1145\/2832105.2832111"},{"issue":"12","key":"2392_CR11","doi-asserted-by":"publisher","first-page":"1745","DOI":"10.1243\/09544062JMES813FT","volume":"221","author":"T Brandvik","year":"2007","unstructured":"Brandvik T, Pullan G (2007) Acceleration of a two-dimensional Euler flow solver using commodity graphics hardware. Proc Inst Mech Eng Part C J Mech Eng Sci 221(12):1745\u20131748","journal-title":"Proc Inst Mech Eng Part C J Mech Eng Sci"},{"key":"2392_CR12","doi-asserted-by":"crossref","unstructured":"Brandvik T, Pullan G (2008) Acceleration of a 3D Euler solver using commodity graphics hardware. In: 46th AIAA aerospace sciences meeting and exhibit, pp 1\u201315","DOI":"10.2514\/6.2008-607"},{"key":"2392_CR13","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.parco.2016.08.005","volume":"58","author":"E Calore","year":"2016","unstructured":"Calore E, Gabbana A, Kraus J, Pellegrini E, Schifano S, Tripiccione R (2016) Massively parallel lattice-Boltzmann codes on large GPU clusters. Parallel Comput 58:1\u201324","journal-title":"Parallel Comput"},{"issue":"12","key":"2392_CR14","doi-asserted-by":"publisher","first-page":"3485","DOI":"10.1002\/cpe.3862","volume":"28","author":"E Calore","year":"2016","unstructured":"Calore E, Gabbana A, Kraus J, Schifano SF, Tripiccione R (2016) Performance and portability of accelerated lattice Boltzmann applications with OpenACC. Concurr Comput Pract Exp 28(12):3485\u20133502","journal-title":"Concurr Comput Pract Exp"},{"key":"2392_CR15","doi-asserted-by":"publisher","first-page":"40","DOI":"10.1016\/j.procs.2014.05.004","volume":"29","author":"E Calore","year":"2014","unstructured":"Calore E, Schifano SF, Tripiccione R (2014) A portable OpenCL lattice Boltzmann code for multi-and many-core processor architectures. Proc Comput Sci 29:40\u201349","journal-title":"Proc Comput Sci"},{"key":"2392_CR16","doi-asserted-by":"publisher","first-page":"70","DOI":"10.1016\/j.cam.2015.02.008","volume":"295","author":"J Campos","year":"2016","unstructured":"Campos J, Oliveira RS, dos Santos RW, Rocha BM (2016) Lattice Boltzmann method for parallel simulations of cardiac electrophysiology using GPUs. J Comput Appl Math 295:70\u201382","journal-title":"J Comput Appl Math"},{"key":"2392_CR17","volume-title":"Professional CUDA C programming","author":"J Cheng","year":"2014","unstructured":"Cheng J, Grossman M, McKercher T (2014) Professional CUDA C programming. Wiley, New York"},{"key":"2392_CR18","doi-asserted-by":"crossref","unstructured":"Chu NSH, Tai CL (2005) MoXi: real-time ink dispersion in absorbent paper. ACM Trans Graph. 24(3):504\u2013511. \n                    http:\/\/visgraph.cs.ust.hk\/MoXi\/","DOI":"10.1145\/1073204.1073221"},{"key":"2392_CR19","unstructured":"Clough D (2014) Lattice Boltzmann liquid simulations on graphics hardware, Ph.D. thesis. University of Cape Town"},{"key":"2392_CR20","unstructured":"Corporation N (2016) Parallel programming and computing platform. \n                    http:\/\/www.nvidia.com\/object\/cuda_home_new.html\n                    \n                  . Accessed 11 May 2016"},{"issue":"2","key":"2392_CR21","doi-asserted-by":"publisher","first-page":"462","DOI":"10.1016\/j.camwa.2013.10.002","volume":"67","author":"N Delbosc","year":"2014","unstructured":"Delbosc N, Summers JL, Khan A, Kapur N, Noakes CJ (2014) Optimized implementation of the lattice Boltzmann method on a graphics processing unit towards real-time fluid simulation. Comput Math Appl 67(2):462\u2013475","journal-title":"Comput Math Appl"},{"key":"2392_CR22","doi-asserted-by":"publisher","DOI":"10.1016\/B978-044451612-1\/50009-3","volume-title":"Parallel algorithm for numerical simulation of 3D incompressible flows","author":"T Elizarova","year":"2004","unstructured":"Elizarova T, Milyukova OY (2004) Parallel algorithm for numerical simulation of 3D incompressible flows. Elsevier, Amsterdam"},{"key":"2392_CR23","unstructured":"Evans MW, Harlow FH, Bromberg E (1957) The particle-in-cell-method for hydrodynamic calculations, Technical report. DTIC Document"},{"issue":"1","key":"2392_CR24","first-page":"47","volume":"00","author":"Z Fan","year":"2004","unstructured":"Fan Z, Qiu F, Kaufman A, Yoakum-stover S (2004) GPU cluster for high performance computing. IEEE Supercomput 00(1):47","journal-title":"IEEE Supercomput"},{"issue":"9","key":"2392_CR25","doi-asserted-by":"publisher","first-page":"536","DOI":"10.1016\/j.parco.2011.03.005","volume":"37","author":"C Feichtinger","year":"2011","unstructured":"Feichtinger C, Habich J, K\u00f6stler H, Hager G, R\u00fcde U, Wellein G (2011) A flexible patch-based lattice Boltzmann parallelization approach for heterogeneous GPU\u2013CPU clusters. Parallel Comput 37(9):536\u2013549","journal-title":"Parallel Comput"},{"key":"2392_CR26","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.parco.2014.12.003","volume":"46","author":"C Feichtinger","year":"2015","unstructured":"Feichtinger C, Habich J, K\u00f6stler H, R\u00fcde U, Aoki T (2015) Performance modeling and analysis of heterogeneous lattice Boltzmann simulations on CPU\u2013GPU clusters. Parallel Comput 46:1\u201313","journal-title":"Parallel Comput"},{"key":"2392_CR27","volume-title":"Computational methods for fluid dynamics","author":"JH Ferziger","year":"2012","unstructured":"Ferziger JH, Peric M (2012) Computational methods for fluid dynamics. Springer, Berlin"},{"key":"2392_CR28","doi-asserted-by":"publisher","first-page":"392","DOI":"10.1016\/j.proeng.2013.08.033","volume":"61","author":"D Gaudlitz","year":"2013","unstructured":"Gaudlitz D, Landmann B, Indinger T (2013) Accelerated CFD simulations using Eulerian and Lagrangian methods on GPUs. Proc Eng 61:392\u2013397","journal-title":"Proc Eng"},{"key":"2392_CR29","doi-asserted-by":"crossref","unstructured":"Geveler M, Ribbrock D, G\u00f6ddeke D, Turek S (2010) Lattice-Boltzmann simulation of the shallow-water equations with fluid\u2013structure interaction on multi-and manycore processors. In: Facing the multicore-challenge. Springer, Berlin, pp 92\u2013104","DOI":"10.1007\/978-3-642-16233-6_11"},{"key":"2392_CR30","unstructured":"Goodnight N, Lewin G, Luebke D, Skadron K (2003) A multigrid solver for boundary value problems using programmable graphics hardware. In: ACM SIGGRAPH 2005 Courses, p 193"},{"key":"2392_CR31","doi-asserted-by":"crossref","unstructured":"Guo X, Li W, Iorio F (2016) Convolutional neural networks for steady flow approximation. In: Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining. ACM, pp 481\u2013490","DOI":"10.1145\/2939672.2939738"},{"issue":"1","key":"2392_CR32","doi-asserted-by":"publisher","first-page":"276","DOI":"10.1016\/j.compfluid.2012.02.013","volume":"80","author":"J Habich","year":"2013","unstructured":"Habich J, Feichtinger C, K\u00f6stler H, Hager G, Wellein G (2013) Performance engineering for the lattice Boltzmann method on GPGPUs: architectural requirements and performance results. Comput Fluids 80(1):276\u2013282. \n                    https:\/\/doi.org\/10.1016\/j.compfluid.2012.02.013","journal-title":"Comput Fluids"},{"issue":"5","key":"2392_CR33","doi-asserted-by":"publisher","first-page":"266","DOI":"10.1016\/j.advengsoft.2010.10.007","volume":"42","author":"J Habich","year":"2011","unstructured":"Habich J, Zeiser T, Hager G, Wellein G (2011) Performance analysis and optimization strategies for a D3Q19 lattice Boltzmann kernel on nVIDIA GPUs using CUDA. Adv Eng Softw 42(5):266\u2013272","journal-title":"Adv Eng Softw"},{"key":"2392_CR34","unstructured":"Harris MJ (2004) GPU gems\u2014chapter 38. Fast fluid dynamics simulation on the GPU. GPU Gems 3. \n                    https:\/\/developer.nvidia.com\/gpugems\/GPUGems\/gpugems_ch38.html\n                    \n                  . Accessed 04 May 2017"},{"key":"2392_CR35","doi-asserted-by":"publisher","first-page":"363","DOI":"10.1016\/j.advengsoft.2017.10.005","volume":"115","author":"AR Harwood","year":"2018","unstructured":"Harwood AR, Revell AJ (2018) Interactive flow simulation using Tegra-powered mobile devices. Adv Eng Softw 115:363\u2013373","journal-title":"Adv Eng Softw"},{"issue":"3\u20134","key":"2392_CR36","doi-asserted-by":"publisher","first-page":"927","DOI":"10.1023\/B:JOSS.0000015179.12689.e4","volume":"88","author":"X He","year":"1997","unstructured":"He X, Luo LS (1997) Lattice Boltzmann model for the incompressible Navier\u2013Stokes equation. J Stat Phys 88(3\u20134):927\u2013944","journal-title":"J Stat Phys"},{"key":"2392_CR37","unstructured":"Hennigh O (2017) Lat-net: compressing lattice Boltzmann flow simulations using deep neural networks. arXiv preprint \n                    arXiv:1705.09036"},{"issue":"1","key":"2392_CR38","doi-asserted-by":"publisher","first-page":"201","DOI":"10.1016\/0021-9991(81)90145-5","volume":"39","author":"CW Hirt","year":"1981","unstructured":"Hirt CW, Nichols BD (1981) Volume of fluid (VOF) method for the dynamics of free boundaries. J Comput Phys 39(1):201\u2013225","journal-title":"J Comput Phys"},{"key":"2392_CR39","volume-title":"Numerical methods in fluid dynamics","author":"M Holt","year":"2012","unstructured":"Holt M (2012) Numerical methods in fluid dynamics. Springer, Berlin"},{"key":"2392_CR40","unstructured":"Information GS, Center C (2017) Tsubame2. \n                    http:\/\/www.gsic.titech.ac.jp\/en\/tsubame2\n                    \n                  . Accessed 04 May 2017"},{"key":"2392_CR41","doi-asserted-by":"crossref","unstructured":"Jain S, Tripathi N, Narayanan PJ (2014) Interactive simulation of generalised Newtonian fluids using GPUs. In: Proceedings of the 2014 Indian Conference on Computer Vision Graphics and Image Processing. ACM, p\u00a079","DOI":"10.1145\/2683483.2683562"},{"issue":"12","key":"2392_CR42","doi-asserted-by":"publisher","first-page":"3549","DOI":"10.1016\/j.camwa.2011.03.016","volume":"61","author":"C Jan\u00dfen","year":"2011","unstructured":"Jan\u00dfen C, Krafczyk M (2011) Free surface flow simulations on GPGPUs using the LBM. Comput Math Appl 61(12):3549\u20133563. \n                    https:\/\/doi.org\/10.1016\/j.camwa.2011.03.016","journal-title":"Comput Math Appl"},{"issue":"9","key":"2392_CR43","doi-asserted-by":"publisher","first-page":"2350","DOI":"10.1016\/j.cpc.2014.04.018","volume":"185","author":"M Januszewsky","year":"2014","unstructured":"Januszewsky M, Kostur M (2014) Sailfish, a flexible multi-GPU implementation of the lattice Boltzmann method. Comput Phys Commun 185(9):2350\u20132368","journal-title":"Comput Phys Commun"},{"issue":"5","key":"2392_CR44","doi-asserted-by":"publisher","first-page":"723","DOI":"10.1007\/s11432-009-0091-z","volume":"52","author":"T Jie","year":"2009","unstructured":"Jie T, XuBo Y (2009) Physically-based fluid animation: a survey. Sci China Ser F Inf Sci 52(5):723\u2013740","journal-title":"Sci China Ser F Inf Sci"},{"key":"2392_CR45","unstructured":"Kraus J (2013) An introduction to CUDA-aware MPI. \n                    http:\/\/developer.nvidia.com\/content\/introduction-cuda-aware-mpi\n                    \n                  . Accessed 10 March 2017"},{"key":"2392_CR46","doi-asserted-by":"crossref","unstructured":"Kraus J, Pivanti M, Schifano SF, Tripiccione R, Zanella M (2013) Benchmarking GPUs with a parallel lattice-Boltzmann code. In: Proceedings of the symposium on computer architecture and high performance computing, pp 160\u2013167","DOI":"10.1109\/SBAC-PAD.2013.37"},{"key":"2392_CR47","unstructured":"Kryza T, Dzwinel W (2013) Coupling lattice Boltzmann gas and level set method for simulating free surface flow in GPU\/CUDA environment. In: International Conference on Parallel Processing and Applied Mathematics. Springer, Berlin, pp 731\u2013740"},{"issue":"7","key":"2392_CR48","doi-asserted-by":"publisher","first-page":"2380","DOI":"10.1016\/j.camwa.2009.08.052","volume":"59","author":"F Kuznik","year":"2010","unstructured":"Kuznik F, Obrecht C, Rusaouen G, Roux JJ (2010) LBM based flow simulation using GPU computing processor. Comput Math Appl 59(7):2380\u20132392","journal-title":"Comput Math Appl"},{"key":"2392_CR49","doi-asserted-by":"crossref","unstructured":"Li Q, Zhong C, Li K, Zhang G, Lu X, Zhang Q, Zhao K, Chu X (2012) Implementation of a lattice Boltzmann method for large eddy simulation on multiple GPUs. In: 2012 IEEE 14th International Conference on High Performance Computing and Communication & 2012 IEEE 9th International Conference on Embedded Software and Systems, pp 818\u2013823. \n                    http:\/\/ieeexplore.ieee.org\/lpdocs\/epic03\/wrapper.htm?arnumber=6332253","DOI":"10.1109\/HPCC.2012.115"},{"key":"2392_CR50","unstructured":"Li W, Fan Z, Wei X, Kaufman A (2005) GPU-based flow simulation with complex boundaries. In: GPU Gems 2. \n                    https:\/\/developer.nvidia.com\/gpugems\/GPUGems2\/gpugems2_chapter47.html\n                    \n                  . Accessed 25 Apr 2018"},{"issue":"7\u20138","key":"2392_CR51","doi-asserted-by":"publisher","first-page":"444","DOI":"10.1007\/s00371-003-0210-6","volume":"19","author":"W Li","year":"2003","unstructured":"Li W, Wei X, Kaufman A (2003) Implementing lattice Boltzmann computation on graphics hardware. Vis Comput 19(7\u20138):444\u2013456. \n                    https:\/\/doi.org\/10.1007\/s00371-003-0210-6","journal-title":"Vis Comput"},{"key":"2392_CR52","doi-asserted-by":"publisher","first-page":"209","DOI":"10.1016\/j.ces.2013.06.037","volume":"102","author":"X Li","year":"2013","unstructured":"Li X, Zhang Y, Wang X, Ge W (2013) GPU-based numerical simulation of multi-phase flow in porous media using multiple-relaxation-time lattice Boltzmann method. Chem Eng Sci 102:209\u2013219","journal-title":"Chem Eng Sci"},{"issue":"3","key":"2392_CR53","doi-asserted-by":"publisher","first-page":"200","DOI":"10.1016\/j.cpc.2006.09.005","volume":"176","author":"K Mattila","year":"2007","unstructured":"Mattila K, Hyv\u00e4luoma J, Rossi T, Aspn\u00e4s M, Westerholm J (2007) An efficient swap algorithm for the lattice Boltzmann method. Comput Phys Commun 176(3):200\u2013210","journal-title":"Comput Phys Commun"},{"issue":"10","key":"2392_CR54","doi-asserted-by":"publisher","first-page":"2566","DOI":"10.1016\/j.cpc.2014.06.003","volume":"185","author":"MJ Mawson","year":"2014","unstructured":"Mawson MJ, Revell AJ (2014) Memory transfer optimization for a lattice Boltzmann solver on Kepler architecture nVidia GPUs. Comput Phys Commun 185(10):2566\u20132574","journal-title":"Comput Phys Commun"},{"key":"2392_CR55","doi-asserted-by":"crossref","unstructured":"McIntosh-Smith S, Curran D (2014) Evaluation of a performance portable lattice Boltzmann code using OpenCL. In: Proceedings of the international workshop on OpenCL 2013 & 2014. ACM","DOI":"10.1145\/2664666.2664668"},{"issue":"3","key":"2392_CR56","doi-asserted-by":"publisher","first-page":"462","DOI":"10.1016\/j.cpc.2009.10.017","volume":"181","author":"S Melchionna","year":"2010","unstructured":"Melchionna S, Bernaschi M, Succi S, Kaxiras E, Rybicki FJ, Mitsouras D, Coskun AU, Feldman CL (2010) Hydrokinetic approach to large-scale cardiovascular blood flow. Comput Phys Commun 181(3):462\u2013472","journal-title":"Comput Phys Commun"},{"key":"2392_CR57","doi-asserted-by":"crossref","unstructured":"Mynam M, Sahasrabudhe N, Nandgaonkar A (2012) GPU implementation of a novel hybrid lattice Boltzmann method for non-isothermal flows. In: Proceedings of the 5th ACM Compute Conference: Intelligent & Scalable System Technologies. ACM, p\u00a07","DOI":"10.1145\/2459118.2459125"},{"issue":"4","key":"2392_CR58","doi-asserted-by":"publisher","first-page":"332","DOI":"10.1002\/cpe.1645","volume":"23","author":"J Myre","year":"2011","unstructured":"Myre J, Walsh SD, Lilja D, Saar MO (2011) Performance analysis of single-phase, multiphase, and multicomponent lattice-Boltzmann fluid flow simulations on GPU clusters. Concurr Comput Pract Exp 23(4):332\u2013350","journal-title":"Concurr Comput Pract Exp"},{"issue":"2","key":"2392_CR59","doi-asserted-by":"publisher","first-page":"528","DOI":"10.1007\/s11227-013-1015-7","volume":"67","author":"KE Niemeyer","year":"2014","unstructured":"Niemeyer KE, Sung CJ (2014) Recent progress and challenges in exploiting graphics processors in computational fluid dynamics. J Supercomput 67(2):528\u2013564","journal-title":"J Supercomput"},{"key":"2392_CR60","doi-asserted-by":"crossref","unstructured":"Nita C, Itu LM, Suciu C (2013) GPU accelerated blood flow computation using the lattice Boltzmann method. In: High Performance Extreme Computing Conference (HPEC), 2013 IEEE, pp 1\u20136","DOI":"10.1109\/HPEC.2013.6670324"},{"key":"2392_CR61","unstructured":"Obrecht C, Kuznik F, Tourancheau B, Roux JJ (2010) Global memory access modelling for efficient implementation of the lattice Boltzmann method on graphics processing units. In: International Conference on High Performance Computing for Computational Science. Springer, Berlin, pp 151\u2013161"},{"issue":"12","key":"2392_CR62","doi-asserted-by":"publisher","first-page":"3628","DOI":"10.1016\/j.camwa.2010.01.054","volume":"61","author":"C Obrecht","year":"2011","unstructured":"Obrecht C, Kuznik F, Tourancheau B, Roux JJ (2011) A new approach to the lattice Boltzmann method for graphics processsing units. Comput Math Appl 61(12):3628\u20133638","journal-title":"Comput Math Appl"},{"issue":"3","key":"2392_CR63","doi-asserted-by":"publisher","first-page":"295","DOI":"10.1177\/1094342011414745","volume":"23","author":"C Obrecht","year":"2011","unstructured":"Obrecht C, Kuznik F, Tourancheau B, Roux JJ (2011) The thelma project: multi-GPU implementation of the lattice Boltzmann method. Int J High Perform Comput Appl 23(3):295\u2013303","journal-title":"Int J High Perform Comput Appl"},{"key":"2392_CR64","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1016\/j.compfluid.2012.02.014","volume":"80","author":"C Obrecht","year":"2013","unstructured":"Obrecht C, Kuznik F, Tourancheau B, Roux JJ (2013) Multi-GPU implementation of a hybrid thermal lattice Boltzmann solver using the TheLMA framework. Comput Fluids 80:269\u2013275","journal-title":"Comput Fluids"},{"issue":"2","key":"2392_CR65","doi-asserted-by":"publisher","first-page":"252","DOI":"10.1016\/j.camwa.2011.02.020","volume":"65","author":"C Obrecht","year":"2013","unstructured":"Obrecht C, Kuznik F, Tourancheau B, Roux JJ (2013) Multi-GPU implementation of the lattice Boltzmann method. Comput Math Appl 65(2):252\u2013261","journal-title":"Comput Math Appl"},{"issue":"6\u20137","key":"2392_CR66","doi-asserted-by":"publisher","first-page":"259","DOI":"10.1016\/j.parco.2013.04.001","volume":"39","author":"C Obrecht","year":"2013","unstructured":"Obrecht C, Kuznik F, Tourancheau B, Roux JJ (2013) Scalable lattice Boltzmann solvers for CUDA GPU clusters. Parallel Comput 39(6\u20137):259\u2013270","journal-title":"Parallel Comput"},{"issue":"2","key":"2392_CR67","doi-asserted-by":"publisher","first-page":"463","DOI":"10.1006\/jcph.2000.6636","volume":"169","author":"S Osher","year":"2001","unstructured":"Osher S, Fedkiw RP (2001) Level set methods: an overview and some recent results. J Comput Phys 169(2):463\u2013502","journal-title":"J Comput Phys"},{"key":"2392_CR68","doi-asserted-by":"publisher","first-page":"388","DOI":"10.1016\/j.proeng.2013.08.032","volume":"61","author":"S Posey","year":"2013","unstructured":"Posey S (2013) Considerations for GPU acceleration of parallel CFD. Proc Eng 61:388\u2013391","journal-title":"Proc Eng"},{"key":"2392_CR69","doi-asserted-by":"crossref","unstructured":"Potluri S, Wang H, Bureddy D, Singh AK, Rosales C, Panda DK (2012) Optimizing MPI communication on multi-GPU systems using CUDA inter-process communication. In: Parallel and distributed processing symposium workshops & PhD forum (IPDPSW), 2012 IEEE 26th international. IEEE, pp 1848\u20131857","DOI":"10.1109\/IPDPSW.2012.228"},{"issue":"6","key":"2392_CR70","doi-asserted-by":"publisher","first-page":"479","DOI":"10.1209\/0295-5075\/17\/6\/001","volume":"17","author":"Y Qian","year":"1992","unstructured":"Qian Y, d\u2019Humi\u00e8res D, Lallemand P (1992) Lattice BGK models for Navier\u2013Stokes equation. EPL (Europhys Lett) 17(6):479","journal-title":"EPL (Europhys Lett)"},{"key":"2392_CR71","unstructured":"Qiu FQF, Zhao YZY, Fan ZFZ, Wei XWX, Lorenz H, Wang JWJ, Yoakum-Stover S, Kaufman A, Mueller K (2004) Dispersion simulation and visualization for urban security. In: IEEE visualization 2004, pp 553\u2013560. \n                    http:\/\/ieeexplore.ieee.org\/xpls\/abs_all.jsp?arnumber=1372242"},{"key":"2392_CR72","doi-asserted-by":"publisher","first-page":"163","DOI":"10.1016\/j.simpat.2012.03.004","volume":"25","author":"PR Rinaldi","year":"2012","unstructured":"Rinaldi PR, Dari EA, V\u00e9nere MJ, Clausse A (2012) A lattice-Boltzmann solver for 3D fluid simulation on GPU. Simul Modell Pract Theory 25:163\u2013171. \n                    https:\/\/doi.org\/10.1016\/j.simpat.2012.03.004","journal-title":"Simul Modell Pract Theory"},{"key":"2392_CR73","doi-asserted-by":"crossref","unstructured":"Rosales C (2011) Multiphase LBM distributed over multiple GPUs. In: Cluster Computing (CLUSTER), 2011 IEEE International Conference on. IEEE, pp 1\u20137","DOI":"10.1109\/CLUSTER.2011.9"},{"issue":"12","key":"2392_CR74","doi-asserted-by":"publisher","first-page":"3730","DOI":"10.1016\/j.camwa.2011.04.012","volume":"61","author":"M Sch\u00f6nherr","year":"2011","unstructured":"Sch\u00f6nherr M, Kucher K, Geier M, Stiebler M, Freudiger S, Krafczyk M (2011) Multi-thread implementations of the lattice Boltzmann method on non-uniform grids for CPUs and GPUs. Comput Math Appl 61(12):3730\u20133743","journal-title":"Comput Math Appl"},{"key":"2392_CR75","doi-asserted-by":"publisher","first-page":"984","DOI":"10.1016\/j.procs.2011.04.104","volume":"4","author":"M Schreiber","year":"2011","unstructured":"Schreiber M, Neumann P, Zimmer S, Bungartz HJ (2011) Free-surface lattice-Boltzmann simulation on many-core architectures. Proc Comput Sci 4:984\u2013993. \n                    https:\/\/doi.org\/10.1016\/j.procs.2011.04.104","journal-title":"Proc Comput Sci"},{"key":"2392_CR76","doi-asserted-by":"crossref","unstructured":"Stam J (1999) Stable fluids. In: Proceedings of the 26th Annual Conference on Computer Graphics and Interactive Techniques. ACM Press\/Addison-Wesley Publishing Co, pp 121\u2013128","DOI":"10.1145\/311535.311548"},{"issue":"5","key":"2392_CR77","doi-asserted-by":"publisher","first-page":"723","DOI":"10.1007\/s11432-009-0091-z","volume":"52","author":"J Tan","year":"2009","unstructured":"Tan J, Yang X (2009) Physically-based fluid animation: a survey. Sci China Ser F Inf Sci 52(5):723\u2013740","journal-title":"Sci China Ser F Inf Sci"},{"issue":"1","key":"2392_CR78","doi-asserted-by":"publisher","first-page":"453","DOI":"10.1016\/j.compfluid.2012.01.011","volume":"80","author":"I Tanno","year":"2013","unstructured":"Tanno I, Hashimoto T, Yasuda T, Tanaka Y, Morinishi K, Satofuka N (2013) Simulation of turbulent flow by lattice Boltzmann method and conventional method on a GPU. Comput Fluids 80(1):453\u2013458. \n                    https:\/\/doi.org\/10.1016\/j.compfluid.2012.01.011","journal-title":"Comput Fluids"},{"key":"2392_CR79","doi-asserted-by":"crossref","unstructured":"Tanwar S (2018) A meshfree-based lattice Boltzmann approach for simulation of fluid flows within complex geometries: application of meshfree methods for LBM simulations. In: Analysis and applications of lattice Boltzmann simulations. IGI Global, pp 188\u2013222","DOI":"10.4018\/978-1-5225-4760-0.ch006"},{"key":"2392_CR80","unstructured":"Th\u00fcrey N (2007) Physically based animation of free surface flows with the lattice-Boltzmann method, Ph.D. thesis. University of Erlangen-Nuremberg"},{"key":"2392_CR81","unstructured":"Th\u00fcrey N, R\u00fcde U (2004) Free surface lattice-Boltzmann fluid simulations with and without level sets. In: Vision, modeling, and visualization 2004: proceedings, Standford, p 199"},{"issue":"5","key":"2392_CR82","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1007\/s00791-008-0090-4","volume":"12","author":"N Th\u00fcrey","year":"2009","unstructured":"Th\u00fcrey N, R\u00fcde U (2009) Stable free surface flows with the lattice Boltzmann method on adaptively coarsened grids. Comput Vis Sci 12(5):247\u2013263","journal-title":"Comput Vis Sci"},{"issue":"1","key":"2392_CR83","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1007\/s00791-008-0120-2","volume":"13","author":"J T\u00f6lke","year":"2008","unstructured":"T\u00f6lke J (2008) Implementation of a lattice Boltzmann kernel using the compute unified device architecture developed by nVIDIA. Comput Vis Sci 13(1):29\u201339","journal-title":"Comput Vis Sci"},{"issue":"7","key":"2392_CR84","doi-asserted-by":"publisher","first-page":"443","DOI":"10.1080\/10618560802238275","volume":"22","author":"J Tolke","year":"2008","unstructured":"Tolke J, Krafczyk M (2008) Teraflop computing on a desktop PC with GPUs for 3D CFD. Int J Comput Fluid Dyn 22(7):443\u2013456","journal-title":"Int J Comput Fluid Dyn"},{"key":"2392_CR85","doi-asserted-by":"publisher","unstructured":"Tran NP, Lee M, Hong S (2017) Performance optimization of 3D lattice Boltzmann flow solver on a GPU. Sci Program 2017:1205892. \n                    https:\/\/doi.org\/10.1155\/2017\/1205892","DOI":"10.1155\/2017\/1205892"},{"key":"2392_CR86","doi-asserted-by":"crossref","unstructured":"Tripathi N, Narayanan P (2013) Generalized Newtonian fluid simulations. In: Computer Vision, Pattern Recognition, Image Processing and Graphics (NCVPRIPG), 2013 Fourth National Conference on. IEEE, pp 1\u20134","DOI":"10.1109\/NCVPRIPG.2013.6776169"},{"issue":"3","key":"2392_CR87","doi-asserted-by":"publisher","first-page":"316","DOI":"10.1002\/nme.3066","volume":"86","author":"KR Tubbs","year":"2011","unstructured":"Tubbs KR, Tsai FTC (2011) GPU accelerated lattice Boltzmann model for shallow water flow and mass transport. Int J Numer Methods Eng 86(3):316\u2013334","journal-title":"Int J Numer Methods Eng"},{"issue":"24","key":"2392_CR88","doi-asserted-by":"publisher","first-page":"e4221","DOI":"10.1002\/cpe.4221","volume":"29","author":"P Valero-Lara","year":"2017","unstructured":"Valero-Lara P (2017) Reducing memory requirements for large size LBM simulations on GPUs. Concurr Comput Pract Exp 29(24):e4221. \n                    https:\/\/doi.org\/10.1002\/cpe.4221","journal-title":"Concurr Comput Pract Exp"},{"issue":"3","key":"2392_CR89","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11432-013-4816-7","volume":"56","author":"C Wang","year":"2013","unstructured":"Wang C, Zhang Q, Kong F (2013) Simulation of free-surface flow using a boundless grid. Sci China Inf Sci 56(3):1\u201310","journal-title":"Sci China Inf Sci"},{"key":"2392_CR90","doi-asserted-by":"publisher","first-page":"192","DOI":"10.1016\/j.compfluid.2015.04.004","volume":"115","author":"Z Wang","year":"2015","unstructured":"Wang Z, Zhao Y, Sawchuck AP, Dalsing MC, Yu H (2015) GPU acceleration of volumetric lattice Boltzmann method for patient-specific computational hemodynamics. Comput Fluids 115:192\u2013200. \n                    https:\/\/doi.org\/10.1016\/j.compfluid.2015.04.004","journal-title":"Comput Fluids"},{"key":"2392_CR91","unstructured":"Wei X, Zhao Y, Fan Z, Li W, Yoakum-Stover S, Kaufman A (2003) Blowing in the wind. In: Proceedings of the 2003 ACM SIGGRAPH\/eurographics symposium on computer animation. Eurographics Association, pp 75\u201385"},{"issue":"8","key":"2392_CR92","doi-asserted-by":"publisher","first-page":"910","DOI":"10.1016\/j.compfluid.2005.02.008","volume":"35","author":"G Wellein","year":"2006","unstructured":"Wellein G, Zeiser T, Hager G, Donath S (2006) On the single processor performance of simple lattice Boltzmann kernels. Comput Fluids 35(8):910\u2013919","journal-title":"Comput Fluids"},{"issue":"9","key":"2392_CR93","doi-asserted-by":"publisher","first-page":"521","DOI":"10.1016\/j.parco.2011.02.007","volume":"37","author":"W Xian","year":"2011","unstructured":"Xian W, Takayuki A (2011) Multi-GPU performance of incompressible flow computation by lattice Boltzmann method on GPU cluster. Parallel Comput 37(9):521\u2013535. \n                    https:\/\/doi.org\/10.1016\/j.parco.2011.02.007","journal-title":"Parallel Comput"},{"issue":"7","key":"2392_CR94","doi-asserted-by":"publisher","first-page":"707","DOI":"10.1007\/s11434-011-4908-y","volume":"57","author":"Q Xiong","year":"2012","unstructured":"Xiong Q, Li B, Xu J, Fang X, Wang X, Wang L, He X, Ge W (2012) Efficient parallel implementation of the lattice Boltzmann method on large clusters of graphic processing units. Chin Sci Bull 57(7):707\u2013715","journal-title":"Chin Sci Bull"},{"key":"2392_CR95","doi-asserted-by":"publisher","first-page":"577","DOI":"10.1016\/j.ijheatmasstransfer.2017.02.032","volume":"109","author":"A Xu","year":"2017","unstructured":"Xu A, Shi L, Zhao T (2017) Accelerated lattice Boltzmann simulation using GPU and OpenACC with data management. Int J Heat Mass Transf 109:577\u2013588","journal-title":"Int J Heat Mass Transf"},{"key":"2392_CR96","doi-asserted-by":"publisher","first-page":"241","DOI":"10.1016\/j.compfluid.2013.08.005","volume":"88","author":"Y Ye","year":"2013","unstructured":"Ye Y, Li K (2013) Entropic lattice Boltzmann method based high reynolds number flow simulation using CUDA on GPU. Comput Fluids 88:241\u2013249","journal-title":"Comput Fluids"},{"issue":"3","key":"2392_CR97","doi-asserted-by":"publisher","first-page":"42","DOI":"10.1145\/3024918","volume":"60","author":"M Zahran","year":"2017","unstructured":"Zahran M (2017) Heterogeneous computing: here to stay. Commun ACM 60(3):42\u201345","journal-title":"Commun ACM"},{"key":"2392_CR98","doi-asserted-by":"crossref","unstructured":"Zhang J, Yuasa S, Fukuma S, Mori SI (2016) A real-time GPU-based coupled fluid-structure simulation with haptic interaction. In: Computer and Information Science (ICIS), 2016 IEEE\/ACIS 15th International Conference on. IEEE, pp 1\u20136","DOI":"10.1109\/ICIS.2016.7550842"},{"issue":"5","key":"2392_CR99","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1007\/s00371-007-0191-y","volume":"24","author":"Y Zhao","year":"2008","unstructured":"Zhao Y (2008) Lattice Boltzmann based PDE solver on the GPU. Vis Comput 24(5):323\u2013333","journal-title":"Vis Comput"},{"issue":"1","key":"2392_CR100","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1109\/TVCG.2007.24","volume":"13","author":"Y Zhao","year":"2007","unstructured":"Zhao Y, Han Y, Fan Z, Qiu F, Kuo YC, Kaufman AE, Mueller K (2007) Visual simulation of heat shimmering and mirage. IEEE Trans Vis Comput Graph 13(1):179\u2013189","journal-title":"IEEE Trans Vis Comput Graph"},{"key":"2392_CR101","doi-asserted-by":"crossref","unstructured":"Zhao Y, Qiu F, Fan Z, Kaufman A (2007) Flow simulation with locally-refined LBM. In: Proceedings of the 2007 symposium on interactive 3D graphics and games. ACM, pp. 181\u2013188","DOI":"10.1145\/1230100.1230132"},{"issue":"4","key":"2392_CR102","doi-asserted-by":"publisher","first-page":"519","DOI":"10.1016\/j.cag.2006.03.009","volume":"30","author":"Y Zhao","year":"2006","unstructured":"Zhao Y, Wang L, Qiu F, Kaufman A, Mueller K (2006) Melting and flowing in multiphase environment. Comput Graph (Pergamon) 30(4):519\u2013528","journal-title":"Comput Graph (Pergamon)"},{"issue":"3\u20134","key":"2392_CR103","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1002\/cav.143","volume":"17","author":"H Zhu","year":"2006","unstructured":"Zhu H, Liu X, Liu Y, Wu E (2006) Simulation of miscible binary mixtures based on lattice Boltzmann method. Comput Anim Virtual Worlds 17(3\u20134):403\u2013410","journal-title":"Comput Anim Virtual Worlds"}],"container-title":["The Journal of Supercomputing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11227-018-2392-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-018-2392-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-018-2392-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,4,27]],"date-time":"2019-04-27T03:26:07Z","timestamp":1556335567000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11227-018-2392-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,4,27]]},"references-count":103,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2018,7]]}},"alternative-id":["2392"],"URL":"https:\/\/doi.org\/10.1007\/s11227-018-2392-8","relation":{},"ISSN":["0920-8542","1573-0484"],"issn-type":[{"value":"0920-8542","type":"print"},{"value":"1573-0484","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,4,27]]},"assertion":[{"value":"27 April 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}