{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T04:17:16Z","timestamp":1780373836980,"version":"3.54.1"},"reference-count":49,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,12,17]],"date-time":"2025-12-17T00:00:00Z","timestamp":1765929600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,12,17]],"date-time":"2025-12-17T00:00:00Z","timestamp":1765929600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Computing"],"published-print":{"date-parts":[[2026,1]]},"DOI":"10.1007\/s00607-025-01596-8","type":"journal-article","created":{"date-parts":[[2025,12,17]],"date-time":"2025-12-17T08:44:50Z","timestamp":1765961090000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Survey on distributed parallel genetic algorithms for large-scale data analysis"],"prefix":"10.1007","volume":"108","author":[{"given":"Laila","family":"Al-Terkawi","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,12,17]]},"reference":[{"key":"1596_CR1","volume-title":"Genetic Algorithms in Search, Optimization, and Machine Learning","author":"DE Goldberg","year":"1989","unstructured":"Goldberg DE (1989) Genetic Algorithms in Search, Optimization, and Machine Learning. Addison-Wesley, Boston, MA"},{"key":"1596_CR2","volume-title":"Holland","author":"H John","year":"1975","unstructured":"John H (1975) Holland. Adaptation in Natural and Artificial Systems. University of Michigan Press, Ann Arbor, MI"},{"issue":"2","key":"1596_CR3","doi-asserted-by":"publisher","first-page":"65","DOI":"10.1007\/BF00175354","volume":"4","author":"D Whitley","year":"1994","unstructured":"Whitley D (1994) A genetic algorithm tutorial. Stat Comput 4(2):65\u201385. https:\/\/doi.org\/10.1007\/BF00175354","journal-title":"Stat Comput"},{"key":"1596_CR4","volume-title":"An Introduction to Genetic Algorithms","author":"M Mitchell","year":"1998","unstructured":"Mitchell M (1998) An Introduction to Genetic Algorithms. MIT Press, Cambridge, MA, USA (ISBN 0262631857)"},{"key":"1596_CR5","doi-asserted-by":"publisher","DOI":"10.1002\/0471739383","volume-title":"Parallel Metaheuristics: A New Class of Algorithms","author":"E Alba","year":"2005","unstructured":"Alba E (2005) Parallel Metaheuristics: A New Class of Algorithms. Wiley-Interscience, USA (ISBN 0471678066)"},{"key":"1596_CR6","unstructured":"Cantu-Paz E (2000) Efficient and Accurate Parallel Genetic Algorithms. PhD thesis, University of Illinois at Urbana-Champaign"},{"key":"1596_CR7","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2020.106497","volume":"95","author":"H-C Lu","year":"2020","unstructured":"Lu H-C, Hwang FJ, Huang Y-H (2020a) Parallel and distributed architecture of genetic algorithm on apache hadoop and spark. Applied Soft Computing 95:106497. https:\/\/doi.org\/10.1016\/j.asoc.2020.106497","journal-title":"Applied Soft Computing"},{"key":"1596_CR8","doi-asserted-by":"publisher","unstructured":"Verma A, Llora X, Goldberg DE, Campbell RH (2009) Scaling genetic algorithms using mapreduce. In Proceedings of the 2009 Ninth International Conference on Intelligent Systems Design and Applications, ISDA \u201909, pages 13\u201318, Washington, DC, USA. IEEE Computer Society. ISBN 978-0-7695-3872-3. https:\/\/doi.org\/10.1109\/ISDA.2009.181","DOI":"10.1109\/ISDA.2009.181"},{"key":"1596_CR9","unstructured":"Samadi et al (2024) Distributed genetic algorithm for application placement in the cloud-fog continuum. Future Generation Computer Systems"},{"key":"1596_CR10","unstructured":"Maqbool F, Razzaq S, Lehmann J, Jabeen H (2024) Scalable distributed genetic algorithm using apache spark (s-ga). ResearchGate Preprint"},{"issue":"16","key":"1596_CR11","doi-asserted-by":"publisher","first-page":"11469","DOI":"10.1007\/s00500-023-08301-x","volume":"27","author":"Carolina Salto","year":"2023","unstructured":"Salto Carolina, Minetti Gabriela, Alba Enrique, Luque Gabriel (2023a) Big optimization with genetic algorithms: hadoop, spark, and mpi. Soft Comput. 27(16):11469\u201311484. https:\/\/doi.org\/10.1007\/s00500-023-08301-x. (ISSN 1432-7643)","journal-title":"Soft Comput."},{"issue":"16","key":"1596_CR12","doi-asserted-by":"publisher","first-page":"11469","DOI":"10.1007\/s00500-023-08301-x","volume":"27","author":"Carolina Salto","year":"2023","unstructured":"Salto Carolina, Minetti Gabriela, Alba Enrique, Luque Gabriel (2023b) Big optimization with genetic algorithms: hadoop, spark, and mpi. Soft Comput 27(16):11469\u201311484. https:\/\/doi.org\/10.1007\/s00500-023-08301-x. (ISSN 1432-7643)","journal-title":"Soft Comput"},{"key":"1596_CR13","unstructured":"CantA-Paz, E (1998) A survey of parallel genetic algorithms. CALCULATEURS PARALLELES, 10"},{"key":"1596_CR14","doi-asserted-by":"crossref","unstructured":"Alba E, Troya JM (1999) A survey of parallel distributed genetic algorithms. Complex., 4(4):31\u201352. ISSN 1076-2787. https:\/\/doi.org\/10.1002\/(SICI)1099-0526(199903\/04)4:4$$<$$31::AID-CPLX5$$>$$3.0.CO;2-4","DOI":"10.1002\/(SICI)1099-0526(199903\/04)4:4<31::AID-CPLX5>3.0.CO;2-4"},{"issue":"2","key":"1596_CR15","doi-asserted-by":"publisher","first-page":"85","DOI":"10.26599\/BDMA.2019.9020015","volume":"3","author":"MS Mahmud","year":"2020","unstructured":"Mahmud MS, Huang JZ, Salloum S, Emara TZ, Sadatdiynov K (2020) A survey of data partitioning and sampling methods to support big data analysis. Big Data Min Anal 3(2):85\u2013101. https:\/\/doi.org\/10.26599\/BDMA.2019.9020015","journal-title":"Big Data Min Anal"},{"key":"1596_CR16","doi-asserted-by":"publisher","unstructured":"O\u2019Reilly U-M, Wagy M, Hodjat B (2013) EC-Star: A Massive-Scale, Hub and Spoke, Distributed Genetic Programming System, pages 73\u201385. Springer New York, New York, NY. ISBN 978-1-4614-6846-2. https:\/\/doi.org\/10.1007\/978-1-4614-6846-2_6","DOI":"10.1007\/978-1-4614-6846-2_6"},{"key":"1596_CR17","doi-asserted-by":"crossref","unstructured":"Dam HH, Abbass HA, Lokan CJ (2005) Dxcs: an xcs system for distributed data mining. In GECCO","DOI":"10.1145\/1068009.1068326"},{"key":"1596_CR18","unstructured":"Guo Y, R\u00fcger SM, Sutiwaraphun J, Forbes-millott J (1997) Meta-learning for parallel data mining. In Proceedings of the Seventh Parallel Computing Workshop, pages 1\u20132"},{"key":"1596_CR19","doi-asserted-by":"crossref","unstructured":"Sherry D, Veeramachaneni K, McDermott J, O\u2019Reilly U-M (2012) Flex-gp: Genetic programming on the cloud. In Applications of Evolutionary Computation, pages 477\u2013486, Berlin, Heidelberg, Springer Berlin Heidelberg. ISBN 978-3-642-29178-4","DOI":"10.1007\/978-3-642-29178-4_48"},{"issue":"1","key":"1596_CR20","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean J, Ghemawat S (2008) Mapreduce: simplified data processing on large clusters. Commun ACM 51(1):107\u2013113. https:\/\/doi.org\/10.1145\/1327452.1327492. (ISSN 0001-0782)","journal-title":"Commun ACM"},{"key":"1596_CR21","doi-asserted-by":"publisher","first-page":"417","DOI":"10.1007\/s11390-016-1635-5","volume":"31","author":"R Qi","year":"2016","unstructured":"Qi R, Wang Z-J, Li S-Y (2016) A parallel genetic algorithm based on spark for pairwise test suite generation. J Comput Sci Tech 31:417\u2013427","journal-title":"J Comput Sci Tech"},{"key":"1596_CR22","doi-asserted-by":"publisher","unstructured":"Paduraru C, Melemciuc M-C, Stefanescu A (2017) A distributed implementation using apache spark of a genetic algorithm applied to test data generation. In Proceedings of the Genetic and Evolutionary Computation Conference Companion, GECCO \u201917, pages 1857\u20131863, New York, NY, USA. Association for Computing Machinery. ISBN 9781450349390. https:\/\/doi.org\/10.1145\/3067695.3084219","DOI":"10.1145\/3067695.3084219"},{"key":"1596_CR23","doi-asserted-by":"publisher","unstructured":"Di\u00a0Geronimo L, Ferrucci F, Murolo A, Sarro F (2012) A parallel genetic algorithm based on hadoop mapreduce for the automatic generation of junit test suites. In 2012 IEEE Fifth International Conference on Software Testing, Verification and Validation, pages 785\u2013793. https:\/\/doi.org\/10.1109\/ICST.2012.177","DOI":"10.1109\/ICST.2012.177"},{"key":"1596_CR24","doi-asserted-by":"publisher","unstructured":"Buyya R, Jin C, Vecchiola C (2008) Mrpga: an extension of mapreduce for parallelizing genetic algorithms. In 2008 IEEE Fourth International Conference on eScience, pages 214\u2013221, Indianapolis, IN, USA. ISBN 978-1-4244-3380-3. https:\/\/doi.org\/10.1109\/eScience.2008.78","DOI":"10.1109\/eScience.2008.78"},{"key":"1596_CR25","first-page":"58","volume":"4","author":"N Hans","year":"2015","unstructured":"Hans N, Mahajan S, Omkar S (2015) Big data clustering using genetic algorithm on hadoop mapreduce. Int J Scic Tech Res 4:58\u201362","journal-title":"Int J Scic Tech Res"},{"key":"1596_CR26","doi-asserted-by":"publisher","unstructured":"Kondekar R, Gupta A, Saluja G, Maru R, Rokde AR, Deshpande P (2012) A mapreduce based hybrid genetic algorithm using island approach for solving time dependent vehicle routing problem. In 2012 International Conference on Computer and Information Science (ICCIS), volume\u00a01, pages 263\u2013269. IEEE. https:\/\/doi.org\/10.1109\/ICCISci.2012.6297214","DOI":"10.1109\/ICCISci.2012.6297214"},{"key":"1596_CR27","doi-asserted-by":"publisher","first-page":"290","DOI":"10.1504\/IJCAT.2013.052807","volume":"46","author":"D Xin","year":"2013","unstructured":"Xin D, Ni Y, Yao Z, Xiao R, Xie D (2013) High performance parallel evolutionary algorithm model based on mapreduce framework. IJCAT 46:290\u2013295","journal-title":"IJCAT"},{"key":"1596_CR28","doi-asserted-by":"publisher","unstructured":"Huang D-W, Lin J (2010) Scaling populations of a genetic algorithm for job shop scheduling problems using mapreduce. In 2010 IEEE Second International Conference on Cloud Computing Technology and Science, pages 780\u2013785. https:\/\/doi.org\/10.1109\/CloudCom.2010.18","DOI":"10.1109\/CloudCom.2010.18"},{"key":"1596_CR29","unstructured":"Zaharia M, Chowdhury M, Das T, Dave A, Ma J, McCauley M, Franklin MJ, Shenker S, Stoica I (2012) Resilient distributed datasets: A fault-tolerant abstraction for in-memory cluster computing. In Proceedings of the 9th USENIX Conference on Networked Systems Design and Implementation (NSDI \u201912), pages 15\u201328. USENIX Association"},{"key":"1596_CR30","doi-asserted-by":"publisher","unstructured":"Alterkawi L, Migliavacca M (2019) Parallelism and partitioning in large-scale gas using spark. In Proceedings of the Genetic and Evolutionary Computation Conference, GECCO \u201919, pages 736\u2013744, New York, NY, USA. Association for Computing Machinery. ISBN 9781450361118. https:\/\/doi.org\/10.1145\/3321707.3321775","DOI":"10.1145\/3321707.3321775"},{"issue":"1","key":"1596_CR31","doi-asserted-by":"publisher","first-page":"10836","DOI":"10.1038\/s41598-025-93943-0","volume":"15","author":"L Al-Terkawi","year":"2025","unstructured":"Al-Terkawi L, Migliavacca M (2025) An automated parallel genetic algorithm with parametric adaptation for distributed data analysis. Sci Rep 15(1):10836. https:\/\/doi.org\/10.1038\/s41598-025-93943-0","journal-title":"Sci Rep"},{"issue":"2","key":"1596_CR32","doi-asserted-by":"publisher","first-page":"1089","DOI":"10.1007\/s10586-017-0838-z","volume":"20","author":"H Chengyu","year":"2017","unstructured":"Chengyu H, Ren G, Liu C, Li M, Jie W (2017) A spark-based genetic algorithm for sensor placement in large scale drinking water distribution systems. Clust Comput 20(2):1089\u20131099. https:\/\/doi.org\/10.1007\/s10586-017-0838-z","journal-title":"Clust Comput"},{"key":"1596_CR33","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2020.106497","volume":"95","author":"H-C Lu","year":"2020","unstructured":"Lu H-C, Hwang FJ, Huang Y-H (2020b) Parallel and distributed architecture of genetic algorithm on apache hadoop and spark. Applied Soft Computing 95:106497. https:\/\/doi.org\/10.1016\/j.asoc.2020.106497. (ISSN 1568-4946)","journal-title":"Applied Soft Computing"},{"key":"1596_CR34","doi-asserted-by":"publisher","unstructured":"Cheraghchi F, Iranzad A, Raahemi B (2017) Subspace selection in high-dimensional big data using genetic algorithm in apache spark. In Proceedings of the Second International Conference on Internet of Things, Data and Cloud Computing, ICC \u201917, New York, NY, USA. Association for Computing Machinery. ISBN 9781450347747. https:\/\/doi.org\/10.1145\/3018896.3018950","DOI":"10.1145\/3018896.3018950"},{"key":"1596_CR35","unstructured":"Rivera AJ, Perez-Godoy MD, Pulgar F, del Jesus MJ (2017) Genrbfnspark: A first implementation in spark of a genetic algorithm to rbfn design. In Proceedings of IEEE Congress on Evolutionary Computation, pages 505\u2013512. IEEE"},{"issue":"2","key":"1596_CR36","doi-asserted-by":"publisher","first-page":"1105","DOI":"10.1007\/s10586-019-02954-w","volume":"23","author":"Y Zhang","year":"2020","unstructured":"Zhang Y, Wang L, Chen J, Zhang Yu (2020) Research on distributed model forecasting parallel framework based on adaptive genetic algorithm. Clust Comput 23(2):1105\u20131114. https:\/\/doi.org\/10.1007\/s10586-019-02954-w","journal-title":"Clust Comput"},{"issue":"8","key":"1596_CR37","doi-asserted-by":"publisher","first-page":"7708","DOI":"10.1109\/TITS.2021.3104075","volume":"23","author":"Y Zhang","year":"2022","unstructured":"Zhang Y, Zhou Y, Huapu L, Fujita H (2022) Spark cloud-based parallel computing for traffic network flow predictive control using non-analytical predictive model. IEEE Trans Intell Transp Syst 23(8):7708\u20137720. https:\/\/doi.org\/10.1109\/TITS.2021.3104075","journal-title":"IEEE Trans Intell Transp Syst"},{"key":"1596_CR38","doi-asserted-by":"publisher","unstructured":"Nguyen X-T, Cao P-N, Nguyen V-Q, Kim K, Huynh Q-T (2019) A genetic algorithm for large graph partitioning problem. In Proceedings of the 10th International Symposium on Information and Communication Technology, SoICT \u201919, pages 419\u2013424, New York, NY, USA. Association for Computing Machinery. ISBN 9781450372459. https:\/\/doi.org\/10.1145\/3368926.3369724","DOI":"10.1145\/3368926.3369724"},{"key":"1596_CR39","doi-asserted-by":"publisher","unstructured":"Hmida H, Hamida SB, Borgi A, Rukoz M (2019) Genetic programming over spark for higgs boson classification. In Abramowicz W, Corchuelo R, editors, Business Information Systems - 22nd International Conference, BIS 2019, Seville, Spain, June 26-28, 2019, Proceedings, Part I, volume 353 of Lecture Notes in Business Information Processing, pages 300\u2013312. Springer. https:\/\/doi.org\/10.1007\/978-3-030-20485-3_23","DOI":"10.1007\/978-3-030-20485-3_23"},{"issue":"3","key":"1596_CR40","doi-asserted-by":"publisher","first-page":"2021","DOI":"10.1007\/s10586-020-03162-7","volume":"23","author":"M AlJame","year":"2020","unstructured":"AlJame M, Ahmad I, Alfailakawi M (2020) Apache spark implementation of whale optimization algorithm. Clust Comput 23(3):2021\u20132034. https:\/\/doi.org\/10.1007\/s10586-020-03162-7","journal-title":"Clust Comput"},{"key":"1596_CR41","unstructured":"Samadi et al (2023a) Parallel genetic algorithm for vehicle routing problems. Journal of Big Data. URL https:\/\/journalofbigdata.springeropen.com\/articles\/10.1186\/s40537-023-00681-5. Accessed: 2024-06-12"},{"key":"1596_CR42","unstructured":"Samadi et al (2023b) Comparison of hadoop and spark for genetic algorithms. Journal of Big Data. URL https:\/\/journalofbigdata.springeropen.com\/articles\/10.1186\/s40537-023-00679-9. Accessed: 2024-06-12"},{"issue":"4","key":"1596_CR43","doi-asserted-by":"publisher","first-page":"20","DOI":"10.4018\/IJGHPC.2018100102","volume":"10","author":"M Bouaziz","year":"2018","unstructured":"Bouaziz M, Mahdi A, Mahammed LH, Bounour N (2018) A grammar-guided genetic programming algorithm for associative classification in big data. Int J Grid High Perform Comput (IJGHPC) 10(4):20\u201338. https:\/\/doi.org\/10.4018\/IJGHPC.2018100102","journal-title":"Int J Grid High Perform Comput (IJGHPC)"},{"key":"1596_CR44","doi-asserted-by":"publisher","unstructured":"Rocklin M (2015) Dask: Parallel computation with blocked algorithms and task scheduling. In Proceedings of the 14th Python in Science Conference, pages 130\u2013136. https:\/\/doi.org\/10.25080\/Majora-7b98e3ed-013","DOI":"10.25080\/Majora-7b98e3ed-013"},{"key":"1596_CR45","unstructured":"Augspurger T (2018) Distributed auto-ml with tpot using dask. https:\/\/tomaugspurger.net\/posts\/distributed-tpot\/. Blog post demonstrating TPOT with Dask on an 80-core cluster"},{"key":"1596_CR46","unstructured":"Moritz P, Nishihara R, Wang S, Tumanov A, Liaw R, Liang E, Elibol M, Yang Z, Paul W, Jordan MI, Stoica I (2018) Ray: A distributed framework for emerging ai applications. In Proceedings of the 13th USENIX Symposium on Operating Systems Design and Implementation (OSDI), pages 561\u2013577"},{"key":"1596_CR47","unstructured":"DMTSource (2020) deap_ray: Ray-based map function for deap. https:\/\/github.com\/DMTSource\/deap_ray. GitHub repository providing Ray integration with DEAP"},{"key":"1596_CR48","unstructured":"Ray Project Contributors (2025) Ray tune: Population-based training for hyperparameter optimization. https:\/\/docs.ray.io. Documentation of PBT support in Ray Tune"},{"key":"1596_CR49","doi-asserted-by":"crossref","unstructured":"Lange RT (2022) evosax: Jax-based evolution strategies. arXiv preprint arXiv:2212.04180","DOI":"10.1145\/3583133.3590733"}],"container-title":["Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00607-025-01596-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00607-025-01596-8","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00607-025-01596-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,31]],"date-time":"2026-01-31T05:19:07Z","timestamp":1769836747000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00607-025-01596-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,17]]},"references-count":49,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,1]]}},"alternative-id":["1596"],"URL":"https:\/\/doi.org\/10.1007\/s00607-025-01596-8","relation":{},"ISSN":["0010-485X","1436-5057"],"issn-type":[{"value":"0010-485X","type":"print"},{"value":"1436-5057","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,12,17]]},"assertion":[{"value":"12 May 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 November 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 December 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The author declare no Conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not applicable. This study did not involve human participants, human data, or animals.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval and consent to participate"}}],"article-number":"6"}}