{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,24]],"date-time":"2026-01-24T05:56:02Z","timestamp":1769234162679,"version":"3.49.0"},"reference-count":51,"publisher":"Springer Science and Business Media LLC","issue":"31","license":[{"start":{"date-parts":[[2023,7,19]],"date-time":"2023-07-19T00:00:00Z","timestamp":1689724800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,7,19]],"date-time":"2023-07-19T00:00:00Z","timestamp":1689724800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Neural Comput &amp; Applic"],"published-print":{"date-parts":[[2025,11]]},"DOI":"10.1007\/s00521-023-08802-8","type":"journal-article","created":{"date-parts":[[2023,7,19]],"date-time":"2023-07-19T00:02:08Z","timestamp":1689724928000},"page":"25601-25617","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Language model-accelerated deep symbolic optimization"],"prefix":"10.1007","volume":"37","author":[{"given":"Felipe Leno","family":"da Silva","sequence":"first","affiliation":[]},{"given":"Andre","family":"Goncalves","sequence":"additional","affiliation":[]},{"given":"Sam","family":"Nguyen","sequence":"additional","affiliation":[]},{"given":"Denis","family":"Vashchenko","sequence":"additional","affiliation":[]},{"given":"Ruben","family":"Glatt","sequence":"additional","affiliation":[]},{"given":"Thomas","family":"Desautels","sequence":"additional","affiliation":[]},{"given":"Mikel","family":"Landajuela","sequence":"additional","affiliation":[]},{"given":"Daniel","family":"Faissol","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1841-3888","authenticated-orcid":false,"given":"Brenden","family":"Petersen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,7,19]]},"reference":[{"key":"8802_CR1","first-page":"33985","volume":"35","author":"Q Lu","year":"2016","unstructured":"Lu Q, Ren J, Wang Z (2016) Using genetic programming with prior formula knowledge to solve symbolic regression problem. Comput Intell Neurosci 35:33985\u201333998","journal-title":"Comput Intell Neurosci"},{"key":"8802_CR2","unstructured":"Yu K, Sciuto C, Jaggi M, Musat C, Salzmann M (2020) Evaluating the search phase of neural architecture search. In: International conference on learning representations (ICLR)"},{"key":"8802_CR3","doi-asserted-by":"crossref","unstructured":"Kitzelmann E (2009) Inductive programming: a survey of program synthesis techniques. In: Workshop on approaches and applications of inductive programming, pp 50\u201373","DOI":"10.1007\/978-3-642-11931-6_3"},{"key":"8802_CR4","unstructured":"Petersen BK, Landajuela M, Mundhenk TN, Santiago CP, Kim SK, Kim JT (2021) Deep symbolic regression: recovering mathematical expressions from data via risk-seeking policy gradients. In: Proceeding of the international conference on learning representations (ICLR)"},{"key":"8802_CR5","doi-asserted-by":"publisher","first-page":"645","DOI":"10.1613\/jair.1.11396","volume":"64","author":"FLD Silva","year":"2019","unstructured":"Silva FLD, Costa AHR (2019) A survey on transfer learning for multiagent reinforcement learning systems. J Artif Intell Res (JAIR) 64:645\u2013703","journal-title":"J Artif Intell Res (JAIR)"},{"key":"8802_CR6","unstructured":"Barto AG, Thomas PS, Sutton RS (2017) Some recent applications of reinforcement learning. In: Proceedings of the eighteenth Yale workshop on adaptive and learning systems"},{"key":"8802_CR7","first-page":"4860","volume":"33","author":"S-M Udrescu","year":"2020","unstructured":"Udrescu S-M, Tan A, Feng J, Neto O, Wu T, Tegmark M (2020) Ai Feynman 2.0: Pareto-optimal symbolic regression exploiting graph modularity. Adv Neural Inf Process Syst 33:4860\u20134871","journal-title":"Adv Neural Inf Process Syst"},{"issue":"15","key":"8802_CR8","doi-asserted-by":"publisher","first-page":"3932","DOI":"10.1073\/pnas.1517384113","volume":"113","author":"SL Brunton","year":"2016","unstructured":"Brunton SL, Proctor JL, Kutz JN (2016) Discovering governing equations from data by sparse identification of nonlinear dynamical systems. Proc Natl Acad Sci 113(15):3932\u20133937","journal-title":"Proc Natl Acad Sci"},{"key":"8802_CR9","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1007\/BF00175355","volume":"4","author":"JR Koza","year":"1994","unstructured":"Koza JR (1994) Genetic programming as a means for programming computers by natural selection. Stat Comput 4:87\u2013112","journal-title":"Stat Comput"},{"key":"8802_CR10","first-page":"24912","volume":"34","author":"T Mundhenk","year":"2021","unstructured":"Mundhenk T, Landajuela M, Glatt R, Santiago C, Petersen B et al (2021) Symbolic regression via deep reinforcement learning enhanced genetic programming seeding. Adv Neural Inf Process Syst 34:24912","journal-title":"Adv Neural Inf Process Syst"},{"key":"8802_CR11","first-page":"33985","volume":"35","author":"M Landajuela","year":"2022","unstructured":"Landajuela M, Lee CS, Yang J, Glatt R, Santiago CP, Aravena I, Mundhenk T, Mulcahy G, Petersen BK (2022) A unified framework for deep symbolic regression. Adv Neural Inf Process Syst 35:33985\u201333998","journal-title":"Adv Neural Inf Process Syst"},{"key":"8802_CR12","unstructured":"Landajuela M, Petersen BK, Kim S, Santiago CP, Glatt R, Mundhenk N, Pettit JF, Faissol D (2021) Discovering symbolic policies with deep reinforcement learning. In: International conference on machine learning (ICML). PMLR, pp 5979\u20135989"},{"key":"8802_CR13","unstructured":"Pettit JF, Petersen BK, Cockrell C, Larie DB, Silva FL, An G, Faissol DM (2021) Learning sparse symbolic policies for sepsis treatment. In: Interpretable machine learning in healthcare workshop at ICML"},{"key":"8802_CR14","unstructured":"Glatt R, Silva FLd, Bui VH, Huang C, Xue L, Wang M, Chang F, Murphey Y, Su W (2022) Deep symbolic optimization for electric component sizing in fixed topology power converters. In: Workshop on AI for design and manufacturing (ADAM)"},{"key":"8802_CR15","unstructured":"Devlin J, Chang M, Lee K, Toutanova K (2019) BERT: pre-training of deep bidirectional transformers for language understanding. In: Conference of the North American chapter of the association for computational linguistics: human language technologies, (NAACL-HLT), pp 4171\u20134186"},{"issue":"140","key":"8802_CR16","first-page":"1","volume":"21","author":"C Raffel","year":"2020","unstructured":"Raffel C, Shazeer N, Roberts A, Lee K, Narang S, Matena M, Zhou Y, Li W, Liu PJ (2020) Exploring the limits of transfer learning with a unified text-to-text transformer. J Mach Learn Res 21(140):1\u201367","journal-title":"J Mach Learn Res"},{"issue":"4","key":"8802_CR17","first-page":"1","volume":"13","author":"MT Pilehvar","year":"2020","unstructured":"Pilehvar MT, Camacho-Collados J (2020) Embeddings in natural language processing: theory and advances in vector representations of meaning. Synth Lect Hum Lang Technol 13(4):1\u2013175","journal-title":"Synth Lect Hum Lang Technol"},{"issue":"1","key":"8802_CR18","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40537-016-0043-6","volume":"3","author":"K Weiss","year":"2016","unstructured":"Weiss K, Khoshgoftaar TM, Wang D (2016) A survey of transfer learning. J Big data 3(1):1\u201340","journal-title":"J Big data"},{"issue":"1","key":"8802_CR19","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1007\/s10710-012-9177-2","volume":"14","author":"DR White","year":"2013","unstructured":"White DR, Mcdermott J, Castelli M, Manzoni L, Goldman BW, Kronberger G, Ja\u015bkowski W, O\u2019Reilly U-M, Luke S (2013) Better GP benchmarks: community survey results and proposals. Genet Program Evolvable Mach 14(1):3\u201329","journal-title":"Genet Program Evolvable Mach"},{"key":"8802_CR20","doi-asserted-by":"publisher","first-page":"103","DOI":"10.7717\/peerj-cs.103","volume":"3","author":"A Meurer","year":"2017","unstructured":"Meurer A, Smith CP, Paprocki M, \u010cert\u00edk O, Kirpichev SB, Rocklin M, Kumar A, Ivanov S, Moore JK, Singh S et al (2017) Sympy: symbolic computing in python. PeerJ Comput Sci 3:103","journal-title":"PeerJ Comput Sci"},{"key":"8802_CR21","doi-asserted-by":"crossref","unstructured":"Mikolov T, Karafi\u00e1t M, Burget L, \u010cernock\u1ef3 J, Khudanpur S (2010) Recurrent neural network based language model. In: Eleventh annual conference of the international speech communication association","DOI":"10.21437\/Interspeech.2010-343"},{"issue":"2","key":"8802_CR22","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1007\/s10710-010-9121-2","volume":"12","author":"NQ Uy","year":"2011","unstructured":"Uy NQ, Hoai NX, O\u2019Neill M, McKay RI, Galv\u00e1n-L\u00f3pez E (2011) Semantically-based crossover in genetic programming: application to real-valued symbolic regression. Genet Program Evolvable Mach 12(2):91\u2013119","journal-title":"Genet Program Evolvable Mach"},{"issue":"2","key":"8802_CR23","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1084\/jem.132.2.211","volume":"132","author":"TT Wu","year":"1970","unstructured":"Wu TT, Kabat EA (1970) An analysis of the sequences of the variable regions of Bence Jones proteins and myeloma light chains and their implications for antibody complementarity. J Exp Med 132(2):211\u2013250","journal-title":"J Exp Med"},{"issue":"5","key":"8802_CR24","doi-asserted-by":"publisher","first-page":"343","DOI":"10.1038\/nri1837","volume":"6","author":"PJ Carter","year":"2006","unstructured":"Carter PJ (2006) Potent antibody therapeutics by design. Nat Rev Immunol 6(5):343\u2013357","journal-title":"Nat Rev Immunol"},{"issue":"5","key":"8802_CR25","doi-asserted-by":"publisher","first-page":"1549","DOI":"10.1093\/bib\/bbz095","volume":"21","author":"RA Norman","year":"2019","unstructured":"Norman RA, Ambrosetti F, Bonvin AMJJ, Colwell LJ, Kelm S, Kumar S, Krawczyk K (2019) Computational approaches to therapeutic antibody design: established methods and emerging trends. Brief Bioinform 21(5):1549\u20131567","journal-title":"Brief Bioinform"},{"key":"8802_CR26","doi-asserted-by":"crossref","unstructured":"Desautels T, Zemla A, Lau E, Franco M, Faissol D (2020) Rapid in silico design of antibodies targeting SARS-CoV-2 using machine learning and supercomputing. BioRxiv","DOI":"10.1101\/2020.04.03.024885"},{"key":"8802_CR27","doi-asserted-by":"publisher","first-page":"545","DOI":"10.1016\/B978-0-12-381270-4.00019-6","volume":"487","author":"A Leaver-Fay","year":"2011","unstructured":"Leaver-Fay A, Tyka M, Lewis SM, Lange OF, Thompson J, Jacak R, Kaufman KW, Renfrew PD, Smith CA, Sheffler W et al (2011) ROSETTA3: an object-oriented software suite for the simulation and design of macromolecules. Methods Enzymol 487:545\u2013574","journal-title":"Methods Enzymol"},{"issue":"21","key":"8802_CR28","doi-asserted-by":"publisher","first-page":"5389","DOI":"10.1021\/acs.jpcb.7b11367","volume":"122","author":"KA Barlow","year":"2018","unstructured":"Barlow KA, \u00d3 Conch\u00fair S, Thompson S, Suresh P, Lucas JE, Heinonen M, Kortemme T (2018) Flex ddG: Rosetta ensemble-based estimation of changes in protein-protein binding affinity upon mutation. J Phys Chem B 122(21):5389\u20135399","journal-title":"J Phys Chem B"},{"key":"8802_CR29","first-page":"1257","volume":"18","author":"E Snelson","year":"2006","unstructured":"Snelson E, Ghahramani Z (2006) Sparse Gaussian processes using pseudo-inputs. Adv Neural Inf Process Syst 18:1257","journal-title":"Adv Neural Inf Process Syst"},{"issue":"8","key":"8802_CR30","doi-asserted-by":"publisher","first-page":"2536","DOI":"10.1073\/pnas.0307140101","volume":"101","author":"J Sui","year":"2004","unstructured":"Sui J, Li W, Murakami A, Tamin A, Matthews LJ, Wong SK, Moore MJ, Tallarico ASC, Olurinde M, Choe H et al (2004) Potent neutralization of severe acute respiratory syndrome (SARS) coronavirus by a human mAb to S1 protein that blocks receptor association. Proc Natl Acad Sci 101(8):2536\u20132541","journal-title":"Proc Natl Acad Sci"},{"issue":"5","key":"8802_CR31","doi-asserted-by":"publisher","first-page":"1026","DOI":"10.1016\/j.cell.2018.12.028","volume":"176","author":"AC Walls","year":"2019","unstructured":"Walls AC, Xiong X, Park Y-J, Tortorici MA, Snijder J, Quispe J, Cameroni E, Gopal R, Dai M, Lanzavecchia A et al (2019) Unexpected receptor functional mimicry elucidates activation of coronavirus fusion. Cell 176(5):1026\u20131039","journal-title":"Cell"},{"issue":"29","key":"8802_CR32","doi-asserted-by":"publisher","first-page":"12123","DOI":"10.1073\/pnas.0701000104","volume":"104","author":"Z Zhu","year":"2007","unstructured":"Zhu Z, Chakraborti S, He Y, Roberts A, Sheahan T, Xiao X, Hensley LE, Prabakaran P, Rockx B, Sidorov IA et al (2007) Potent cross-reactive neutralization of SARS coronavirus isolates by human monoclonal antibodies. Proc Natl Acad Sci 104(29):12123\u201312128","journal-title":"Proc Natl Acad Sci"},{"issue":"6","key":"8802_CR33","doi-asserted-by":"publisher","first-page":"926","DOI":"10.1093\/bioinformatics\/btu739","volume":"31","author":"BE Suzek","year":"2014","unstructured":"Suzek BE, Wang Y, Huang H, McGarvey PB, Wu CH (2014) The UniProt Consortium: UniRef clusters: a comprehensive and scalable alternative for improving sequence similarity searches. Bioinformatics 31(6):926\u2013932","journal-title":"Bioinformatics"},{"key":"8802_CR34","doi-asserted-by":"crossref","unstructured":"Steinegger M, Mirdita M, S\u00f6ding J (2018) Protein-level assembly increases protein sequence recovery from metagenomic samples manyfold. bioRxiv","DOI":"10.1101\/386110"},{"key":"8802_CR35","doi-asserted-by":"crossref","unstructured":"Vashchenko D, Nguyen S, Goncalves A, Silva FLd, Petersen B, Desautels T, Faissol D (2022) AbBERT: learning antibody humanness via masked language modeling. In: Workshop on healthcare AI and Covid-19","DOI":"10.1101\/2022.08.02.502236"},{"issue":"1","key":"8802_CR36","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1002\/pro.4205","volume":"31","author":"TH Olsen","year":"2022","unstructured":"Olsen TH, Boyles F, Deane CM (2022) Observed antibody space: a diverse database of cleaned, annotated, and translated unpaired and paired antibody sequences. Protein Sci 31(1):141\u2013146","journal-title":"Protein Sci"},{"key":"8802_CR37","unstructured":"Azunre P (2021) Transfer learning for natural language processing. Simon and Schuster"},{"key":"8802_CR38","doi-asserted-by":"crossref","unstructured":"Pennington J, Socher R, Manning CD (2014) Glove: global vectors for word representation. In: Empirical methods in natural language processing (EMNLP), pp 1532\u20131543","DOI":"10.3115\/v1\/D14-1162"},{"key":"8802_CR39","unstructured":"Mikolov T, Chen K, Corrado G, Dean J (2013) Efficient estimation of word representations in vector space. arXiv:1301.3781 [cs.CL]"},{"key":"8802_CR40","unstructured":"...Brown TB, Mann B, Ryder N, Subbiah M, Kaplan J, Dhariwal P, Neelakantan A, Shyam P, Sastry G, Askell A, Agarwal S, Herbert-Voss A, Krueger G, Henighan T, Child R, Ramesh A, Ziegler DM, Wu J, Winter C, Hesse C, Chen M, Sigler E, Litwin M, Gray S, Chess B, Clark J, Berner C, McCandlish S, Radford A, Sutskever I, Amodei D (2000) Language models are few-shot learners (2020). arXiv:2005.14165 [cs.CL]"},{"key":"8802_CR41","unstructured":"Valipour M, You B, Panju M, Ghodsi A. SymbolicGPT: A generative transformer model for symbolic regression. arXiv:2106.14131"},{"key":"8802_CR42","unstructured":"Reid M, Yamada Y, Gu SS (2022) Can wikipedia help offline reinforcement learning? arXiv:2201.12122"},{"key":"8802_CR43","unstructured":"Chai D, Wu W, Han Q, Wu F, Li J (2020) Description based text classification with reinforcement learning. In: International conference on machine learning (ICML), pp 1371\u20131382"},{"key":"8802_CR44","doi-asserted-by":"crossref","unstructured":"Luketina J, Nardelli N, Farquhar G, Foerster J, Andreas J, Grefenstette E, Whiteson S, Rockt\u00e4schel T (2019) A survey of reinforcement learning informed by natural language. In: International joint conference on artificial intelligence (IJCAI), pp 6309\u20136317","DOI":"10.24963\/ijcai.2019\/880"},{"key":"8802_CR45","unstructured":"Bahdanau D, Hill F, Leike J, Hughes E, Kohli P, Grefenstette E (2019) Learning to understand goal specifications by modelling reward. In: International conference on learning representations (ICRL)"},{"issue":"1","key":"8802_CR46","doi-asserted-by":"publisher","first-page":"849","DOI":"10.1613\/jair.1.11263","volume":"63","author":"K Narasimhan","year":"2018","unstructured":"Narasimhan K, Barzilay R, Jaakkola T (2018) Grounding language for transfer in deep reinforcement learning. J Artif Intell Res (JAIR) 63(1):849\u2013874","journal-title":"J Artif Intell Res (JAIR)"},{"key":"8802_CR47","unstructured":"Bahdanau D, Hill F, Leike J, Hughes E, Kohli P, Grefenstette E (2018) Learning to follow language instructions with adversarial reward induction. arXiv:1806.01946"},{"key":"8802_CR48","unstructured":"Yu H, Zhang H, Xu W (2018) Interactive grounded language acquisition and generalization in a 2D world. In: International conference on learning representations (ICLR)"},{"key":"8802_CR49","unstructured":"Hermann KM, Hill F, Green S, Wang F, Faulkner R, Soyer H, Szepesvari D, Czarnecki WM, Jaderberg M, Teplyashin D, Wainwright M, Apps C, Hassabis D, Blunsom P (2017) Grounded language learning in a simulated 3D world. arXiv:1706.06551"},{"key":"8802_CR50","unstructured":"Kim JT, Larma ML, Petersen BK (2021) Distilling wikipedia mathematical knowledge into neural network models. In: Mathematical reasoning in general artificial intelligence workshop"},{"key":"8802_CR51","unstructured":"Silva FLd, Goncalves A, Nguyen S, Vashchenko D, Glatt R, Desautels T, Landajuela M, Petersen B, Faissol D (2022) Leveraging language models to efficiently learn symbolic optimization solutions. In: Adaptive and learning agents (ALA) workshop"}],"container-title":["Neural Computing and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00521-023-08802-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00521-023-08802-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00521-023-08802-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T05:02:25Z","timestamp":1760850145000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00521-023-08802-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,7,19]]},"references-count":51,"journal-issue":{"issue":"31","published-print":{"date-parts":[[2025,11]]}},"alternative-id":["8802"],"URL":"https:\/\/doi.org\/10.1007\/s00521-023-08802-8","relation":{},"ISSN":["0941-0643","1433-3058"],"issn-type":[{"value":"0941-0643","type":"print"},{"value":"1433-3058","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,7,19]]},"assertion":[{"value":"26 October 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 June 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 July 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}