{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,10]],"date-time":"2026-04-10T17:16:21Z","timestamp":1775841381877,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":40,"publisher":"ACM","funder":[{"name":"the National Natural Science Foundation of China","award":["62422605"],"award-info":[{"award-number":["62422605"]}]},{"name":"the National Natural Science Foundation of China","award":["62533021"],"award-info":[{"award-number":["62533021"]}]},{"name":"the National Natural Science Foundation of China","award":["92370132"],"award-info":[{"award-number":["92370132"]}]},{"name":"the Fundamental Research Program of Shanxi Province","award":["202503021212091"],"award-info":[{"award-number":["202503021212091"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,4,13]]},"DOI":"10.1145\/3774904.3792816","type":"proceedings-article","created":{"date-parts":[[2026,4,9]],"date-time":"2026-04-09T21:54:39Z","timestamp":1775771679000},"page":"8150-8161","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["AFE-Master: Enhancing LLM-Driven Autonomous Feature Engineering with Domain-Specific Language Parsing and Guided Local Search"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-8371-2297","authenticated-orcid":false,"given":"Hebin","family":"Liang","sequence":"first","affiliation":[{"name":"Tianjin University, Tianjin, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0422-8235","authenticated-orcid":false,"given":"Jianye","family":"Hao","sequence":"additional","affiliation":[{"name":"Tianjin University, Tianjin, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4537-348X","authenticated-orcid":false,"given":"Jinyi","family":"Liu","sequence":"additional","affiliation":[{"name":"Tianjin University, Tianjin, 
China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9375-6605","authenticated-orcid":false,"given":"Yi","family":"Ma","sequence":"additional","affiliation":[{"name":"Shanxi University, Taiyuan, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-4916-3481","authenticated-orcid":false,"given":"Zilin","family":"Cao","sequence":"additional","affiliation":[{"name":"Tianjin University, Tianjin, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-7042-0389","authenticated-orcid":false,"given":"Jing","family":"Liang","sequence":"additional","affiliation":[{"name":"Tianjin University, Tianjin, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0965-4302","authenticated-orcid":false,"given":"Kun","family":"Shao","sequence":"additional","affiliation":[{"name":"Huawei Noah's Ark Lab, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1811-129X","authenticated-orcid":false,"given":"Zhaocheng","family":"Du","sequence":"additional","affiliation":[{"name":"Huawei Noah's Ark Lab, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-5623-2782","authenticated-orcid":false,"given":"Fei","family":"Ni","sequence":"additional","affiliation":[{"name":"Imperial College London, London, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-2194-942X","authenticated-orcid":false,"given":"Yifu","family":"Yuan","sequence":"additional","affiliation":[{"name":"Tianjin University, Tianjin, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5016-6549","authenticated-orcid":false,"given":"Yan","family":"Zheng","sequence":"additional","affiliation":[{"name":"Tianjin University, Tianjin, China"}]}],"member":"320","published-online":{"date-parts":[[2026,4,12]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"LLM-FE: Automated Feature Engineering for Tabular Data with LLMs as Evolutionary Optimizers. arXiv preprint arXiv:2503.14434","author":"Abhyankar Nikhil","year":"2025","unstructured":"Nikhil Abhyankar, Parshin Shojaee, and Chandan K Reddy. 2025. 
LLM-FE: Automated Feature Engineering for Tabular Data with LLMs as Evolutionary Optimizers. arXiv preprint arXiv:2503.14434 (2025)."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939785"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2019.00017"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/3696410.3714962"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/3511808.3557559"},{"key":"e_1_3_2_1_6_1","first-page":"4171","volume-title":"Proceedings of the 2019 conference of the North American chapter of the association for computational linguistics: human language technologies","volume":"1","author":"Devlin Jacob","year":"2019","unstructured":"Jacob Devlin, Ming-Wei Chang, Kenton Lee, and Kristina Toutanova. 2019. Bert: Pre-training of deep bidirectional transformers for language understanding. In Proceedings of the 2019 conference of the North American chapter of the association for computational linguistics: human language technologies, volume 1 (long and short papers). 4171-4186."},{"key":"e_1_3_2_1_7_1","unstructured":"Kalashnikov Dmitry Irpan Alex Pastor Peter Ibarz Julian Herzog Alexander Jang Eric Quillen Deirdre Holly Ethan Kalakrishnan Mrinal Vanhoucke Vincent et al. 2018. Qt-opt. Scalable deep reinforcement learning for vision-based robotic manipulation. arXiv preprint (2018)."},{"key":"e_1_3_2_1_8_1","first-page":"38","volume-title":"LightCS: Selecting Quadratic Feature Crosses in Linear Complexity. In Companion Proceedings of the ACM Web Conference","author":"Du Zhaocheng","year":"2024","unstructured":"Zhaocheng Du, Junhao Chen, Qinglin Jia, Chuhan Wu, Jieming Zhu, Zhenhua Dong, and Ruiming Tang. 2024a. LightCS: Selecting Quadratic Feature Crosses in Linear Complexity. In Companion Proceedings of the ACM Web Conference 2024. 
38-46."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/3640457.3687094"},{"key":"e_1_3_2_1_10_1","first-page":"18932","article-title":"Revisiting deep learning models for tabular data","volume":"34","author":"Gorishniy Yury","year":"2021","unstructured":"Yury Gorishniy, Ivan Rubachev, Valentin Khrulkov, and Artem Babenko. 2021. Revisiting deep learning models for tabular data. Advances in Neural Information Processing Systems, Vol. 34 (2021), 18932-18943.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_11_1","volume-title":"DS-Agent: Automated Data Science by Empowering Large Language Models with Case-Based Reasoning. arXiv preprint arXiv:2402.17453","author":"Guo Siyuan","year":"2024","unstructured":"Siyuan Guo, Cheng Deng, Ying Wen, Hechang Chen, Yi Chang, and Jun Wang. 2024. DS-Agent: Automated Data Science by Empowering Large Language Models with Case-Based Reasoning. arXiv preprint arXiv:2402.17453 (2024)."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.52202\/075280-1938"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-024-08328-6"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.findings-acl.1016"},{"key":"e_1_3_2_1_15_1","volume-title":"Zijuan Lin, et al.","author":"Hong Sirui","year":"2023","unstructured":"Sirui Hong, Mingchen Zhuge, Jonathan Chen, Xiawu Zheng, Yuheng Cheng, Jinlin Wang, Ceyao Zhang, Zili Wang, Steven Ka Shing Yau, Zijuan Lin, et al., 2023. MetaGPT: Meta programming for a multi-agent collaborative framework. In The twelfth international conference on learning representations."},{"key":"e_1_3_2_1_16_1","volume-title":"Agentcoder: Multi-agent-based code generation with iterative testing and optimisation. arXiv preprint arXiv:2312.13010","author":"Huang Dong","year":"2023","unstructured":"Dong Huang, Jie M Zhang, Michael Luck, Qingwen Bu, Yuhao Qing, and Heming Cui. 2023. 
Agentcoder: Multi-agent-based code generation with iterative testing and optimisation. arXiv preprint arXiv:2312.13010 (2023)."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/3298689.3347043"},{"key":"e_1_3_2_1_18_1","volume-title":"AltFS: Agency-light Feature Selection with Large Language Models in Deep Recommender Systems. arXiv preprint arXiv:2412.08516","author":"Jia Pengyue","year":"2024","unstructured":"Pengyue Jia, Zhaocheng Du, Yichao Wang, Xiangyu Zhao, Xiaopeng Li, Yuhao Wang, Qidong Liu, Huifeng Guo, and Ruiming Tang. 2024a. AltFS: Agency-light Feature Selection with Large Language Models in Deep Recommender Systems. arXiv preprint arXiv:2412.08516 (2024)."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/3746252.3761378"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/3637528.3671571"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/DSAA.2015.7344858"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2016.0123"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11678"},{"key":"e_1_3_2_1_24_1","volume-title":"One button machine for automating feature engineering in relational databases. arXiv preprint arXiv:1706.00327","author":"Lam Hoang Thanh","year":"2017","unstructured":"Hoang Thanh Lam, Johann-Michael Thiebaut, Mathieu Sinn, Bei Chen, Tiep Mai, and Oznur Alkan. 2017. One button machine for automating feature engineering in relational databases. arXiv preprint arXiv:1706.00327 (2017)."},{"key":"e_1_3_2_1_25_1","volume-title":"The Eleventh International Conference on Learning Representations.","author":"Li Liyao","year":"2023","unstructured":"Liyao Li, Haobo Wang, Liangyu Zha, Qingyi Huang, Sai Wu, Gang Chen, and Junbo Zhao. 2023. Learning a Data-Driven Policy Network for Pre-Training Automated Feature Engineering. 
In The Eleventh International Conference on Learning Representations."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403314"},{"key":"e_1_3_2_1_27_1","volume-title":"When and how to develop domain-specific languages. ACM computing surveys (CSUR)","author":"Mernik Marjan","year":"2005","unstructured":"Marjan Mernik, Jan Heering, and Anthony M Sloane. 2005. When and how to develop domain-specific languages. ACM computing surveys (CSUR), Vol. 37, 4 (2005), 316-344."},{"key":"e_1_3_2_1_28_1","volume-title":"Gsm-symbolic: Understanding the limitations of mathematical reasoning in large language models. arXiv preprint arXiv:2410.05229","author":"Mirzadeh Iman","year":"2024","unstructured":"Iman Mirzadeh, Keivan Alizadeh, Hooman Shahrokhi, Oncel Tuzel, Samy Bengio, and Mehrdad Farajtabar. 2024. Gsm-symbolic: Understanding the limitations of mathematical reasoning in large language models. arXiv preprint arXiv:2410.05229 (2024)."},{"key":"e_1_3_2_1_29_1","first-page":"92352","article-title":"Optimized feature generation for tabular data via llms with decision tree reasoning","volume":"37","author":"Nam Jaehyun","year":"2024","unstructured":"Jaehyun Nam, Kyuyoung Kim, Seunghyuk Oh, Jihoon Tack, Jaehyung Kim, and Jinwoo Shin. 2024. Optimized feature generation for tabular data via llms with decision tree reasoning. Advances in Neural Information Processing Systems, Vol. 37 (2024), 92352-92380.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_30_1","unstructured":"Alec Radford Karthik Narasimhan Tim Salimans Ilya Sutskever et al. 2018. Improving language understanding by generative pre-training. (2018)."},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE48307.2020.00146"},{"key":"e_1_3_2_1_32_1","unstructured":"Weisong Sun Chunrong Fang Yun Miao Yudu You Mengzhe Yuan Yuchen Chen Quanjun Zhang An Guo Xiang Chen Yang Liu et al. 2023. 
Abstract Syntax Tree for Programming Language Understanding and Representation: How Far Are We? arXiv preprint arXiv:2312.00413 (2023)."},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/3711896.3737266"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/3539618.3591767"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3292500.3330949"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2021.107835"},{"key":"e_1_3_2_1_37_1","volume-title":"International Conference on Machine Learning. PMLR, 41880-41901","author":"Zhang Tianping","year":"2023","unstructured":"Tianping Zhang, Zheyu Aqa Zhang, Zhiyuan Fan, Haoyan Luo, Fengyuan Liu, Qian Liu, Wei Cao, and Li Jian. 2023. Openfe: Automated feature generation with expert-level performance. In International Conference on Machine Learning. PMLR, 41880-41901."},{"key":"e_1_3_2_1_38_1","volume-title":"Dynamic and adaptive feature generation with llm. arXiv preprint arXiv:2406.03505","author":"Zhang Xinhao","year":"2024","unstructured":"Xinhao Zhang, Jinghan Zhang, Banafsheh Rekabdar, Yuanchun Zhou, Pengfei Wang, and Kunpeng Liu. 2024. Dynamic and adaptive feature generation with llm. arXiv preprint arXiv:2406.03505 (2024)."},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1109\/ASE.2019.00077"},{"key":"e_1_3_2_1_40_1","volume-title":"International Conference on Automated Machine Learning. PMLR, 17-1.","author":"Zhu Guanghui","year":"2022","unstructured":"Guanghui Zhu, Zhuoer Xu, Chunfeng Yuan, and Yihua Huang. 2022. DIFER: differentiable automated feature engineering. In International Conference on Automated Machine Learning. 
PMLR, 17-1."}],"event":{"name":"WWW '26: The ACM Web Conference 2026","location":"Dubai United Arab Emirates","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web"]},"container-title":["Proceedings of the ACM Web Conference 2026"],"original-title":[],"deposited":{"date-parts":[[2026,4,10]],"date-time":"2026-04-10T16:36:57Z","timestamp":1775839017000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3774904.3792816"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,4,12]]},"references-count":40,"alternative-id":["10.1145\/3774904.3792816","10.1145\/3774904"],"URL":"https:\/\/doi.org\/10.1145\/3774904.3792816","relation":{},"subject":[],"published":{"date-parts":[[2026,4,12]]},"assertion":[{"value":"2026-04-12","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}