{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,15]],"date-time":"2025-10-15T10:28:47Z","timestamp":1760524127372,"version":"3.37.3"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"14","license":[{"start":{"date-parts":[[2021,1,2]],"date-time":"2021-01-02T00:00:00Z","timestamp":1609545600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,2]],"date-time":"2021-01-02T00:00:00Z","timestamp":1609545600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"name":"China National Key Research Project","award":["2019YFC0312003"],"award-info":[{"award-number":["2019YFC0312003"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61402532"],"award-info":[{"award-number":["61402532"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Neural Comput &amp; Applic"],"published-print":{"date-parts":[[2021,7]]},"DOI":"10.1007\/s00521-020-05602-2","type":"journal-article","created":{"date-parts":[[2021,1,2]],"date-time":"2021-01-02T20:02:39Z","timestamp":1609617759000},"page":"8495-8511","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["Incorporating Actor-Critic in Monte Carlo tree search for symbolic regression"],"prefix":"10.1007","volume":"33","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8217-2305","authenticated-orcid":false,"given":"Qiang","family":"Lu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fan","family":"Tao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shuo","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhiguang","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,1,2]]},"reference":[{"key":"5602_CR1","volume-title":"Gene Expression Programming-Mathematical Modeling by an Artificial Intelligence","author":"Candida Ferreira","year":"2016","unstructured":"Ferreira Candida (2016) Gene Expression Programming-Mathematical Modeling by an Artificial Intelligence. Springer, Berlin"},{"key":"5602_CR2","volume-title":"Genetic Programming II, Automatic Discovery of Reusable Subprograms","author":"John R Koza","year":"1992","unstructured":"Koza John R (1992) Genetic Programming II, Automatic Discovery of Reusable Subprograms. MIT Press, Cambridge, MA"},{"key":"5602_CR3","first-page":"109","volume-title":"Genetic Programming Theory and Practice VIII no. 8 in Genetic and Evolutionary Computation","author":"Michael F Korns","year":"2011","unstructured":"Korns Michael F (2011) Abstract Expression Grammar Symbolic Regression. In: Riolo Rick, McConaghy Trent, Vladislavleva Ekaterina (eds) Genetic Programming Theory and Practice VIII no. 8 in Genetic and Evolutionary Computation. Springer, New York, pp. 109\u2013128"},{"key":"5602_CR4","first-page":"129","volume-title":"Genetic Programming Theory and Practice VIII, no.8 in Genetic and Evolutionary Computation","author":"Michael Schmidt","year":"2011","unstructured":"Schmidt Michael, Lipson Hod (2011) Age-Fitness Pareto Optimization. In: Riolo Rick, McConaghy Trent, Vladislavleva Ekaterina (eds) Genetic Programming Theory and Practice VIII, no.8 in Genetic and Evolutionary Computation. Springer, New York, pp. 129\u2013146"},{"issue":"5","key":"5602_CR5","doi-asserted-by":"publisher","first-page":"1165","DOI":"10.1109\/72.623217","volume":"8","author":"Yee Leung","year":"1997","unstructured":"Leung Yee, Gao Yong, Zong-Ben Xu (1997) Degree of population diversity : a perspective on premature convergence in genetic algorithms and its markov chain analysis. IEEE Trans Neural Netw 8(5):1165\u20131176","journal-title":"IEEE Trans Neural Netw"},{"key":"5602_CR6","volume-title":"Differential evolution: a practical approach to global optimization","author":"KV Price","year":"2005","unstructured":"Price KV, Storn RM, Lampinen JA (2005) Differential evolution: a practical approach to global optimization. Springer, Berlin"},{"issue":"1","key":"5602_CR7","doi-asserted-by":"publisher","first-page":"65","DOI":"10.1109\/TEVC.2015.2424410","volume":"20","author":"J Zhong","year":"2016","unstructured":"Zhong J, Ong YS, Cai W (2016) Self-learning gene expression programming. IEEE Trans Evolution Comput 20(1):65\u201380","journal-title":"IEEE Trans Evolution Comput"},{"doi-asserted-by":"crossref","unstructured":"Hansen N (2006) The cma evolution strategy: a comparing review. In: Towards a new evolutionary computation. Springer, pp 75\u2013102 (2006)","key":"5602_CR8","DOI":"10.1007\/11007937_4"},{"doi-asserted-by":"crossref","unstructured":"Ilknur Icke, Joshua C. Bongard: Improving genetic programming based symbolic regression using deterministic machine learning. In: Evolutionary Computation (CEC), 2013 IEEE Congress on, pp. 1763\u20131770. IEEE (2013)","key":"5602_CR9","DOI":"10.1109\/CEC.2013.6557774"},{"issue":"3","key":"5602_CR10","doi-asserted-by":"publisher","first-page":"391","DOI":"10.1007\/s10723-014-9320-9","volume":"13","author":"Kalyan Veeramachaneni","year":"2015","unstructured":"Veeramachaneni Kalyan, Arnaldo Ignacio, Derby Owen, Oreilly Una-May (2015) Flexgp: cloud-based ensemble learning with genetic programming for large regression problems. J Grid Comput 13(3):391\u2013407","journal-title":"J Grid Comput"},{"key":"5602_CR11","first-page":"235","volume-title":"Ffx Fast, scalable, deterministic symbolic regression technology. Genetic Programming Theory and Practice IX","author":"T McConaghy","year":"2011","unstructured":"McConaghy T (2011) Ffx Fast, scalable, deterministic symbolic regression technology. Genetic Programming Theory and Practice IX. Springer, Berlin, pp. 235\u2013260"},{"issue":"454","key":"5602_CR12","doi-asserted-by":"publisher","first-page":"574","DOI":"10.1198\/016214501753168262","volume":"96","author":"Yuhong Yang","year":"2001","unstructured":"Yang Yuhong (2001) Adaptive regression by mixing. J Am Statist Assoc 96(454):574\u2013588","journal-title":"J Am Statist Assoc"},{"doi-asserted-by":"crossref","unstructured":"Giorgos Karafotias, A.E. Eiben, Mark Hoogendoorn: Generic parameter control with reinforcement learning. In: Proceedings of the 2014 Annual Conference on Genetic and Evolutionary Computation, pp. 1319\u20131326. ACM (2014)","key":"5602_CR13","DOI":"10.1145\/2576768.2598360"},{"issue":"3","key":"5602_CR14","doi-asserted-by":"publisher","first-page":"259","DOI":"10.1023\/A:1011953410319","volume":"2","author":"L Keith","year":"2001","unstructured":"Keith L (2001) Downing: reinforced genetic programming. Genetic Programm Evol Mach 2(3):259\u2013288","journal-title":"Genetic Programm Evol Mach"},{"issue":"3","key":"5602_CR15","doi-asserted-by":"publisher","first-page":"369","DOI":"10.1162\/evco.2007.15.3.369","volume":"15","author":"Shingo Mabu","year":"2007","unstructured":"Mabu Shingo, Hirasawa Kotaro, Jinglu Hu (2007) A graph-based evolutionary algorithm: Genetic network programming (gnp) and its extension using reinforcement learning. Evolution Comput 15(3):369\u2013398","journal-title":"Evolution Comput"},{"issue":"1","key":"5602_CR16","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1109\/TEVC.2003.819263","volume":"8","author":"E Burke","year":"2004","unstructured":"Burke E, Gustafson S, Kendall G (2004) Diversity in genetic programming: an analysis of measures and correlation with fitness. IEEE Trans Evolution Comput 8(1):47\u201362","journal-title":"IEEE Trans Evolution Comput"},{"doi-asserted-by":"crossref","unstructured":"Sudholt D (2018) The Benefits of Population Diversity in Evolutionary Algorithms: A Survey of Rigorous Runtime Analyses. arXiv:1801.10087 [cs]","key":"5602_CR17","DOI":"10.1007\/978-3-030-29414-4_8"},{"issue":"3","key":"5602_CR18","doi-asserted-by":"publisher","first-page":"35:1","DOI":"10.1145\/2480741.2480752","volume":"45","author":"M \u010crepin\u0161ek","year":"2013","unstructured":"\u010crepin\u0161ek M, Liu SH, Mernik M (2013) Exploration and exploitation in evolutionary algorithms: a survey. ACM Comput Surv 45(3):35:1\u201335:33","journal-title":"ACM Comput Surv"},{"issue":"6","key":"5602_CR19","doi-asserted-by":"publisher","first-page":"741","DOI":"10.1109\/TEVC.2010.2040180","volume":"15","author":"CK Chow","year":"2011","unstructured":"Chow CK, Yuen SY (2011) An evolutionary algorithm that makes decision based on the entire previous search history. IEEE Trans Evolution Comput 15(6):741\u2013769","journal-title":"IEEE Trans Evolution Comput"},{"unstructured":"Yuen SY, Chow CK (2007) A non-revisiting genetic algorithm. In: IEEE Congress on Evolutionary Computation, pp. 4583\u20134590","key":"5602_CR20"},{"issue":"2","key":"5602_CR21","doi-asserted-by":"publisher","first-page":"454","DOI":"10.1109\/TEVC.2008.2003008","volume":"13","author":"SY Yuen","year":"2009","unstructured":"Yuen SY, Chow CK (2009) A genetic algorithm that adaptively mutates and never revisits. IEEE Trans Evolution Comput 13(2):454\u2013472","journal-title":"IEEE Trans Evolution Comput"},{"issue":"1","key":"5602_CR22","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TCIAIG.2012.2186810","volume":"4","author":"Cameron Browneand Edward Powley","year":"2012","unstructured":"Powley Cameron Browneand Edward, Whitehouse Daniel, Lucas Simon, Cowling Peter I, Rohlfshagen Philipp, Tavener Stephen, Perez Diego, Samothrakis Spyridon, Colton Simon (2012) A survey of monte carlo tree search methods. IEEE Trans Comput Intell AI Games 4(1):1\u201343","journal-title":"IEEE Trans Comput Intell AI Games"},{"issue":"2\u20133","key":"5602_CR23","doi-asserted-by":"publisher","first-page":"235","DOI":"10.1023\/A:1013689704352","volume":"47","author":"Peter Auer","year":"2002","unstructured":"Auer Peter, Cesa-Bianchi Nicol, Fischer Paul (2002) Finite-time analysis of the multiarmed bandit problem. Mach Learn 47(2\u20133):235\u2013256","journal-title":"Mach Learn"},{"key":"5602_CR24","volume-title":"Reinforcement Learning: An Introduction(2nd)","author":"Richard S Sutton","year":"2018","unstructured":"Sutton Richard S, Barto Andrew G (2018) Reinforcement Learning: An Introduction(2nd). The MIT Press, Cambbridge"},{"issue":"4","key":"5602_CR25","doi-asserted-by":"publisher","first-page":"1143","DOI":"10.1137\/S0363012901385691","volume":"42","author":"K Vijaymohan","year":"2003","unstructured":"Vijaymohan K (2003) Actor-critic algorithms. Siam J Control Optimiz 42(4):1143\u20131166","journal-title":"Siam J Control Optimiz"},{"unstructured":"Kennedy James, Eberhart Russell C (1995) Particle swarm optimization. Proceedings of ICNN\u201995\u2014International Conference on Neural Networks 4(0):1942\u20131948","key":"5602_CR26"},{"issue":"7","key":"5602_CR27","doi-asserted-by":"publisher","first-page":"1207","DOI":"10.1109\/TMC.2011.141","volume":"11","author":"S Milner","year":"2012","unstructured":"Milner S, Davis C, Zhang H, Llorca J (2012) Nature-inspired self-organization, control, and optimization in heterogeneous wireless networks. IEEE Trans Mob Comput 11(7):1207\u20131222","journal-title":"IEEE Trans Mob Comput"},{"issue":"7587","key":"5602_CR28","doi-asserted-by":"publisher","first-page":"484","DOI":"10.1038\/nature16961","volume":"529","author":"David Silver","year":"2016","unstructured":"Silver David, Huang Aja, Maddison Chris J, Guez Arthur, Sifre Laurent, van den Driessche George, Schrittwieser Julian, Antonoglou Ioannis, Panneershelvam Veda, Lanctot M, Dieleman S, Grewe D, Nham J, Kalchbrenner N, Sutskever I, Lillicrap T, Leach M, Kavukcuoglu K, Graepel T, Hassabis D (2016) Mastering the game of Go with deep neural networks and tree search. Nature 529(7587):484\u2013489","journal-title":"Nature"},{"doi-asserted-by":"crossref","unstructured":"Levente Kocsis, Csaba Szepesv\u00e1ri (2006) Bandit Based Monte-Carlo Planning. In: Machine Learning: ECML 2006, Lecture Notes in Computer Science, pp. 282\u2013293. Springer","key":"5602_CR29","DOI":"10.1007\/11871842_29"},{"issue":"6","key":"5602_CR30","doi-asserted-by":"publisher","first-page":"26","DOI":"10.1109\/MSP.2017.2743240","volume":"34","author":"Arulkumaran Kai","year":"2017","unstructured":"Kai Arulkumaran (2017) Marc Peter Deisenroth, Miles Brundage Anil, Anthony Bharath: Deep Reinforcement Learning: A Brief Survey. IEEE Signal Process Mag 34(6):26\u201338","journal-title":"IEEE Signal Process Mag"},{"issue":"3\u20134","key":"5602_CR31","first-page":"279","volume":"8","author":"JCH Christopher","year":"1992","unstructured":"Christopher JCH (1992) Watkins. Peter Dayan: Tech note:q-learn Mach learn 8(3\u20134):279\u2013292","journal-title":"Peter Dayan: Tech note:q-learn Mach learn"},{"key":"5602_CR32","volume-title":"Mahesan Niranjan: On-line Q-learning using connectionist systems","author":"Gavin Adrian Rummery","year":"1994","unstructured":"Gavin Adrian Rummery (1994) Mahesan Niranjan: On-line Q-learning using connectionist systems, vol 37. University of Cambridge, Department of Engineering, Cambridge"},{"key":"5602_CR33","first-page":"117","volume-title":"Genetic Programming Theory and Practice X, Genetic and Evolutionary Computation","author":"F Michael","year":"2013","unstructured":"Michael F (2013) Korns: A Baseline Symbolic Regression Algorithm. In: Riolo Rick, Vladislavleva Ekaterina, Ritchie Marylyn D, Moore Jason H (eds) Genetic Programming Theory and Practice X, Genetic and Evolutionary Computation. Springer, New York, pp. 117\u2013137"},{"unstructured":"Goodfellow I, Bengio Y, Courville A (2016) Deep learning. The MIT Press","key":"5602_CR34"},{"issue":"1","key":"5602_CR35","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1007\/s10710-012-9177-2","volume":"14","author":"David R White","year":"2013","unstructured":"White David R, McDermott James, Castelli Mauro, Manzoni Luca, Goldman Brian W, Kronberger Gabriel, Ja\u015bkowski Wojciech, O\u2019Reilly Una-May, Luke Sean (2013) Better GP benchmarks: community survey results and proposals. Genet Program Evolv Mach 14(1):3\u201329","journal-title":"Genet Program Evolv Mach"},{"doi-asserted-by":"crossref","unstructured":"Maarten Keijzer (2003) Improving Symbolic Regression with Interval Arithmetic and Linear Scaling. In: Conor Ryan, Terence Soule, Maarten Keijzer, Edward Tsang, Riccardo Poli, Ernesto Costa (eds.) Genetic Programming, no. 2610 in Lecture Notes in Computer Science, pp. 70\u201382. Springer Berlin Heidelberg","key":"5602_CR36","DOI":"10.1007\/3-540-36599-0_7"},{"doi-asserted-by":"crossref","unstructured":"Ju\u00e1rez-Smith P, Trujillo L (2016) Integrating Local Search within neat-GP. In: Proceedings of the 2016 on Genetic and Evolutionary Computation Conference, GECCO \u201917. ACM","key":"5602_CR37","DOI":"10.1145\/2908961.2931659"},{"doi-asserted-by":"publisher","unstructured":"White DR, Yoo S, Singer J (2015) The Programming Game: Evaluating MCTS as an Alternative to GP for Symbolic Regression. In: Proceedings of the Companion Publication of the 2015 on Genetic and Evolutionary Computation Conference\u2014GECCO Companion\u2019 15, pp. 1521\u20131522. ACM Press, Madrid, Spain. https:\/\/doi.org\/10.1145\/2739482.2764655","key":"5602_CR38","DOI":"10.1145\/2739482.2764655"},{"key":"5602_CR39","doi-asserted-by":"publisher","first-page":"13","DOI":"10.1007\/978-1-4471-0427-8_2","volume-title":"Soft Computing in Engineering Design and Manufacturing","author":"WB Langdon","year":"1998","unstructured":"Langdon WB, Poli R (1998) Fitness Causes Bloat. In: Roy R (ed) Soft Computing in Engineering Design and Manufacturing. Springer, London, pp. 13\u201322"},{"key":"5602_CR40","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1016\/j.ins.2015.11.010","volume":"333","author":"L Trujillo","year":"2016","unstructured":"Trujillo L, Mu\u00f1oz L, Galv\u01cen-L\u01d2pez E, Silva S (2016) Neat Genetic Programming: Controlling bloat naturally. Information Sciences 333:21\u201343","journal-title":"Information Sciences"},{"unstructured":"Cazenave T, Monte-Carlo expression discovery","key":"5602_CR41"},{"doi-asserted-by":"crossref","unstructured":"Cazenave, T.: Monte-carlo expression discovery. Int J Artif Intell Tools 22(1) (2013)","key":"5602_CR42","DOI":"10.1142\/S0218213012500352"},{"issue":"7676","key":"5602_CR43","doi-asserted-by":"publisher","first-page":"354","DOI":"10.1038\/nature24270","volume":"550","author":"D Silver","year":"2017","unstructured":"Silver D, Schrittwieser J, Simonyan K, Antonoglou I, Huang A, Guez A, Hubert T, Baker L, Lai M, Bolton A, Chen Y, Lillicrap T, Hui F, Sifre L, van den Driessche G, Graepel T, Hassabis D (2017) Mastering the game of Go without human knowledge. Nature 550(7676):354\u2013359","journal-title":"Nature"},{"issue":"2","key":"5602_CR44","doi-asserted-by":"publisher","first-page":"301","DOI":"10.1111\/j.1467-9868.2005.00503.x","volume":"67","author":"Hui Zou","year":"2005","unstructured":"Zou Hui, Hastie Trevor (2005) Regularization and variable selection via the elastic net. J R Stat Soc: Ser B (Stat Methodo) 67(2):301\u2013320","journal-title":"J R Stat Soc: Ser B (Stat Methodo)"},{"doi-asserted-by":"crossref","unstructured":"Edward Haslam, Bing Xue, Mengjie Zhang (2016) Further investigation on genetic programming with transfer learning for symbolic regression. In: Evolutionary Computation (CEC), 2016 IEEE Congress on, pp. 3598\u20133605. IEEE","key":"5602_CR45","DOI":"10.1109\/CEC.2016.7744245"},{"doi-asserted-by":"crossref","unstructured":"Thi Thu Huong Dinh, Thi Huong Chu, Quang Uy Nguyen (2015) Transfer learning in genetic programming. In: Evolutionary Computation (CEC), 2015 IEEE Congress on, pp. 1145\u20131151. IEEE","key":"5602_CR46","DOI":"10.1109\/CEC.2015.7257018"},{"key":"5602_CR47","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2016\/4037380","volume":"2016","author":"Lu Qiang","year":"2016","unstructured":"Qiang Lu, Ren Jun, Wang Zhiguang (2016) Using genetic programming with prior formula knowledge to solve symbolic regression problem. Comput Intell Neurosci 2016:1","journal-title":"Comput Intell Neurosci"},{"doi-asserted-by":"crossref","unstructured":"Pak-Kan Wong, Leung-Yau Lo, Man-Leung Wong, Kwong-Sak Leung (2014) Grammar-based genetic programming with bayesian network. In: Evolutionary Computation (CEC), 2014 IEEE Congress on, pp. 739\u2013746. IEEE","key":"5602_CR48","DOI":"10.1109\/CEC.2014.6900423"},{"doi-asserted-by":"crossref","unstructured":"Sotto LFDP, de\u00a0Melo VV (2017) A Probabilistic Linear Genetic Programming with Stochastic Context-free Grammar for Solving Symbolic Regression Problems. In: Proceedings of the Genetic and Evolutionary Computation Conference, GECCO \u201917, pp. 1017\u20131024. ACM","key":"5602_CR49","DOI":"10.1145\/3071178.3071325"},{"doi-asserted-by":"crossref","unstructured":"Lattimore T, Szepesv\u00e1ri C (2020) Bandit algorithms. Cambridge University Press","key":"5602_CR50","DOI":"10.1017\/9781108571401"}],"container-title":["Neural Computing and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00521-020-05602-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00521-020-05602-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00521-020-05602-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,6,22]],"date-time":"2021-06-22T21:14:06Z","timestamp":1624396446000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00521-020-05602-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,1,2]]},"references-count":50,"journal-issue":{"issue":"14","published-print":{"date-parts":[[2021,7]]}},"alternative-id":["5602"],"URL":"https:\/\/doi.org\/10.1007\/s00521-020-05602-2","relation":{},"ISSN":["0941-0643","1433-3058"],"issn-type":[{"type":"print","value":"0941-0643"},{"type":"electronic","value":"1433-3058"}],"subject":[],"published":{"date-parts":[[2021,1,2]]},"assertion":[{"value":"29 May 2020","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 December 2020","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 January 2021","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance with ethical standards"}},{"value":"Qiang Lu, Fan Tao, Shuo Zhou and Zhiguang Wang declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}