{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T14:38:38Z","timestamp":1742913518240,"version":"3.40.3"},"publisher-location":"Cham","reference-count":18,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030742508"},{"type":"electronic","value":"9783030742515"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-74251-5_19","type":"book-chapter","created":{"date-parts":[[2021,4,12]],"date-time":"2021-04-12T15:20:40Z","timestamp":1618240840000},"page":"235-247","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["avatar\u2014Automated Feature Wrangling for Machine Learning"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-9182-597X","authenticated-orcid":false,"given":"Gust","family":"Verbruggen","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6502-0809","authenticated-orcid":false,"given":"Elia","family":"Van Wolputte","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0915-8034","authenticated-orcid":false,"given":"Sebastijan","family":"Duman\u010di\u0107","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6860-6303","authenticated-orcid":false,"given":"Luc","family":"De Raedt","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,4,13]]},"reference":[{"doi-asserted-by":"crossref","unstructured":"Bavishi, R., Lemieux, C., Fox, R., Sen, K., Stoica, I.: Autopandas: neural-backed generators for program synthesis. In: Proceedings of the ACM on Programming Languages 3(OOPSLA), pp. 1\u201327 (2019)","key":"19_CR1","DOI":"10.1145\/3360594"},{"doi-asserted-by":"crossref","unstructured":"Dasu, T., Johnson, T.: Exploratory Data Mining and Data Cleaning, vol. 479. Wiley, New York (2003)","key":"19_CR2","DOI":"10.1002\/0471448354"},{"doi-asserted-by":"crossref","unstructured":"Drosos, I., Barik, T., Guo, P.J., DeLine, R., Gulwani, S.: Wrex: a unified programming-by-example interaction for synthesizing readable code for data scientists. In: Proceedings of the 2020 CHI Conference on Human Factors in Computing Systems, pp. 1\u201312 (2020)","key":"19_CR3","DOI":"10.1145\/3313831.3376442"},{"key":"19_CR4","series-title":"The Springer Series on Challenges in Machine Learning","doi-asserted-by":"publisher","first-page":"113","DOI":"10.1007\/978-3-030-05318-5_6","volume-title":"Automated Machine Learning","author":"M Feurer","year":"2019","unstructured":"Feurer, M., Klein, A., Eggensperger, K., Springenberg, J.T., Blum, M., Hutter, F.: Auto-sklearn: efficient and robust automated machine learning. In: Hutter, F., Kotthoff, L., Vanschoren, J. (eds.) Automated Machine Learning. TSSCML, pp. 113\u2013134. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-05318-5_6"},{"issue":"10","key":"19_CR5","doi-asserted-by":"publisher","first-page":"1165","DOI":"10.14778\/3231751.3231766","volume":"11","author":"Y He","year":"2018","unstructured":"He, Y., Chu, X., Ganjam, K., Zheng, Y., Narasayya, V., Chaudhuri, S.: Transform-data-by-example (TDE) an extensible search engine for data transformations. Proc. VLDB Endow. 11(10), 1165\u20131177 (2018)","journal-title":"Proc. VLDB Endow."},{"doi-asserted-by":"crossref","unstructured":"Jin, Z., Anderson, M.R., Cafarella, M., Jagadish, H.: Foofah: transforming data by example. In: Proceedings of the 2017 ACM International Conference on Management of Data, pp. 683\u2013698 (2017)","key":"19_CR6","DOI":"10.1145\/3035918.3064034"},{"doi-asserted-by":"crossref","unstructured":"Kandel, S., Paepcke, A., Hellerstein, J., Heer, J.: Wrangler: interactive visual specification of data transformation scripts. In: Proceedings of the SIGCHI Conference on Human Factors in Computing Systems, pp. 3363\u20133372 (2011)","key":"19_CR7","DOI":"10.1145\/1978942.1979444"},{"doi-asserted-by":"crossref","unstructured":"Kanter, J.M., Veeramachaneni, K.: Deep feature synthesis: towards automating data science endeavors. In: 2015 IEEE International Conference on Data Science and Advanced Analytics (DSAA), pp. 1\u201310. IEEE (2015)","key":"19_CR8","DOI":"10.1109\/DSAA.2015.7344858"},{"doi-asserted-by":"crossref","unstructured":"Kaul, A., Maheshwary, S., Pudi, V.: Autolearn\u2013automated feature generation and selection. In: 2017 IEEE International Conference on Data Mining (ICDM), pp. 217\u2013226. IEEE (2017)","key":"19_CR9","DOI":"10.1109\/ICDM.2017.31"},{"doi-asserted-by":"crossref","unstructured":"Le, V., Gulwani, S.: Flashextract: a framework for data extraction by examples. In: Proceedings of the 35th ACM SIGPLAN Conference on Programming Language Design and Implementation, pp. 542\u2013553 (2014)","key":"19_CR10","DOI":"10.1145\/2594291.2594333"},{"issue":"1","key":"19_CR11","doi-asserted-by":"publisher","first-page":"2522","DOI":"10.1038\/s42256-019-0138-9","volume":"2","author":"SM Lundberg","year":"2020","unstructured":"Lundberg, S.M., et al.: From local explanations to global understanding with explainable AI for trees. Nat. Mach. Intell. 2(1), 2522\u20135839 (2020)","journal-title":"Nat. Mach. Intell."},{"unstructured":"Lundberg, S.M., Lee, S.I.: A unified approach to interpreting model predictions. In: Advances in Neural Information Processing Systems, pp. 4765\u20134774 (2017)","key":"19_CR12"},{"unstructured":"Olson, R.S., Moore, J.H.: TPOt: a tree-based pipeline optimization tool for automating machine learning. In: Workshop on Automatic Machine Learning, pp. 66\u201374. PMLR (2016)","key":"19_CR13"},{"key":"19_CR14","first-page":"381","volume":"1","author":"V Raman","year":"2001","unstructured":"Raman, V., Hellerstein, J.M.: Potter\u2019s wheel: an interactive data cleaning system. VLDB 1, 381\u2013390 (2001)","journal-title":"VLDB"},{"issue":"28","key":"19_CR15","first-page":"307","volume":"2","author":"LS Shapley","year":"1953","unstructured":"Shapley, L.S.: A value for n-person games. Contrib. Theor. Games 2(28), 307\u2013317 (1953)","journal-title":"Contrib. Theor. Games"},{"doi-asserted-by":"crossref","unstructured":"Van Wolputte, E., Korneva, E., Blockeel, H.: Mercs: multi-directional ensembles of regression and classification trees. In: Proceedings of the Thirty-Second AAAI Conference on Artificial Intelligence, pp. 4276\u20134283. AAAI Publications, New Orleans, Louisiana, USA (2018)","key":"19_CR16","DOI":"10.1609\/aaai.v32i1.11735"},{"doi-asserted-by":"crossref","unstructured":"Yan, C., He, Y.: Auto-suggest: learning-to-recommend data preparation steps using data science notebooks. In: Proceedings of the 2020 ACM SIGMOD International Conference on Management of Data, pp. 1539\u20131554 (2020)","key":"19_CR17","DOI":"10.1145\/3318464.3389738"},{"doi-asserted-by":"crossref","unstructured":"Yang, C., Akimoto, Y., Kim, D.W., Udell, M.: Oboe: collaborative filtering for autoML model selection. In: Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining, pp. 1173\u20131183 (2019)","key":"19_CR18","DOI":"10.1145\/3292500.3330909"}],"container-title":["Lecture Notes in Computer Science","Advances in Intelligent Data Analysis XIX"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-74251-5_19","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,24]],"date-time":"2022-12-24T03:05:04Z","timestamp":1671851104000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-74251-5_19"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030742508","9783030742515"],"references-count":18,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-74251-5_19","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"13 April 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"IDA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Symposium on Intelligent Data Analysis","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Porto","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Portugal","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 April 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 April 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ida2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/ida2021.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"EasyChair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"113","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"35","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"31% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"4","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"No","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"The conference was held online due to the COVID-19 pandemic","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}