{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,12]],"date-time":"2025-12-12T13:07:40Z","timestamp":1765544860354,"version":"3.37.3"},"reference-count":65,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"9","license":[{"start":{"date-parts":[[2023,9,1]],"date-time":"2023-09-01T00:00:00Z","timestamp":1693526400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,9,1]],"date-time":"2023-09-01T00:00:00Z","timestamp":1693526400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,9,1]],"date-time":"2023-09-01T00:00:00Z","timestamp":1693526400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100000266","name":"Engineering and Physical Sciences Research Council","doi-asserted-by":"publisher","award":["EP\/N510129\/1"],"award-info":[{"award-number":["EP\/N510129\/1"]}],"id":[{"id":"10.13039\/501100000266","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100012338","name":"Alan Turing Institute","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100012338","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100012338","name":"Alan Turing Institute","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100012338","id-type":"DOI","asserted-by":"publisher"}]},{"name":"SIRIUS Centre for Scalable Data Access","award":["237889"],"award-info":[{"award-number":["237889"]}]},{"DOI":"10.13039\/100012338","name":"Alan Turing 
Institute","doi-asserted-by":"publisher","award":["TU\/C\/000018"],"award-info":[{"award-number":["TU\/C\/000018"]}],"id":[{"id":"10.13039\/100012338","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Knowl. Data Eng."],"published-print":{"date-parts":[[2023,9,1]]},"DOI":"10.1109\/tkde.2022.3222538","type":"journal-article","created":{"date-parts":[[2022,11,16]],"date-time":"2022-11-16T20:43:48Z","timestamp":1668631428000},"page":"9295-9306","source":"Crossref","is-referenced-by-count":11,"title":["AI Assistants: A Framework for Semi-Automated Data Wrangling"],"prefix":"10.1109","volume":"35","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7242-2208","authenticated-orcid":false,"given":"Tomas","family":"Petricek","sequence":"first","affiliation":[{"name":"Charles University, Prague, Czechia"}]},{"given":"Gerrit J. J. van den","family":"Burg","sequence":"additional","affiliation":[{"name":"Alan Turing Institute, London, U.K."}]},{"given":"Alfredo","family":"Naz\u00e1bal","sequence":"additional","affiliation":[{"name":"Alan Turing Institute, London, U.K."}]},{"given":"Taha","family":"Ceritli","sequence":"additional","affiliation":[{"name":"University of Edinburgh and Alan Turing Institute, London, U.K."}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9083-4599","authenticated-orcid":false,"given":"Ernesto","family":"Jim\u00e9nez-Ruiz","sequence":"additional","affiliation":[{"name":"City, University of London, London, U.K."}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6270-4703","authenticated-orcid":false,"given":"Christopher K. 
I.","family":"Williams","sequence":"additional","affiliation":[{"name":"University of Edinburgh, Edinburgh, U.K."}]}],"member":"263","reference":[{"year":"2016","key":"ref1","article-title":"Data science report"},{"year":"2017","key":"ref2","article-title":"The state of data science & machine learning"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2020.106622"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3495256"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/s10618-019-00646-y"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3220057"},{"key":"ref7","first-page":"1","article-title":"pandas: A foundational Python library for data analysis and statistics","volume":"14","author":"McKinney","year":"2011","journal-title":"Python High Perform. Sci. Comput."},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21105\/joss.01686"},{"year":"2021","key":"ref9","article-title":"Trifacta \u2013 data wrangling software and tools"},{"article-title":"OpenRefine: A free, open source, powerful tool for working with messy data","year":"2021","author":"Delpeuch","key":"ref10"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/1989323.1989449"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1177\/1473871611415994"},{"article-title":"Tabula","year":"2021","author":"Aristar\u00e1n","key":"ref13"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/2240236.2240260"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/1376616.1376759"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2007.250581"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.22152\/programming-journal.org\/2020\/4\/8"},{"key":"ref18","first-page":"1","article-title":"Predictive interaction for data transformation","volume-title":"Proc. Conf. Innov. Data Syst. 
Res.","author":"Heer"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.14778\/1952376.1952378"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3035918.3064024"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/302979.303030"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/VL\/HCC50065.2020.9127254"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3209900.3209913"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/2047196.2047205"},{"year":"2018","key":"ref25","article-title":"Open data"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-61455-2_12"},{"article-title":"Practical coreset constructions for machine learning","year":"2017","author":"Bachem","key":"ref27"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1002\/nav.3800020109"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.17487\/rfc4180"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/s10618-020-00680-1"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.330129"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.2200\/S01125ED1V01Y202109DSK022"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.3233\/SW-140134"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-49461-2_30"},{"article-title":"Data engineering for data analytics: A classification of the issues, and case studies","year":"2020","author":"Naz\u00e1bal","key":"ref35"},{"article-title":"UCI machine learning repository","year":"2013","author":"Bache","key":"ref36"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1002\/SERIES1345"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1145\/2939502.2939511"},{"key":"ref39","first-page":"140","article-title":"The end-user programming challenge of data wrangling","volume-title":"Proc. 27th Annu. Workshop Psychol. Program. Int. 
Group","author":"Gorinova"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1145\/3533378"},{"key":"ref41","first-page":"1","article-title":"Wrattler: Reproducible, live and polyglot notebooks","volume-title":"Proc. 10th USENIX Workshop Theory Pract. Provenance","author":"Petricek"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107501"},{"key":"ref43","first-page":"1927","article-title":"PClean: Bayesian data cleaning at scale with domain-specific probabilistic programming","volume-title":"Proc. Int. Conf. Artif. Intell. Statist.","author":"Lew"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2017.199"},{"key":"ref45","first-page":"381","article-title":"Potter's wheel: An interactive data cleaning system","volume-title":"Proc. 27th Int. Conf. Very Large Data Bases","author":"Raman"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1145\/1366102.1366103"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1145\/3332165.3347940"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2016.2599030"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1145\/1595696.1595728"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1145\/2429376.2429378"},{"key":"ref51","first-page":"21:1","article-title":"Data exploration through dot-driven development","volume-title":"Proc. 31st Eur. Conf. 
Object-Oriented Program.","author":"Petricek"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/2.781635"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1145\/142750.143082"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1145\/263407.263545"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1145\/2380116.2380144"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.14778\/2824032.2824127"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1145\/2984511.2984588"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1145\/3173574.3174047"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.14778\/3137765.3137833"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300233"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1145\/3328519.3329133"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1145\/2463676.2465327"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1145\/2723372.2749431"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.14778\/2350229.2350263"},{"key":"ref65","first-page":"137","article-title":"Programming by examples (and its applications in data wrangling)","volume-title":"Dependable Software Systems Engineering (NATO Science for Peace and Security - D: Information and Communication Security)","author":"Gulwani","year":"2016"}],"container-title":["IEEE Transactions on Knowledge and Data 
Engineering"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/69\/10210449\/09953543.pdf?arnumber=9953543","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,1]],"date-time":"2024-02-01T03:15:50Z","timestamp":1706757350000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9953543\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,9,1]]},"references-count":65,"journal-issue":{"issue":"9"},"URL":"https:\/\/doi.org\/10.1109\/tkde.2022.3222538","relation":{},"ISSN":["1041-4347","1558-2191","2326-3865"],"issn-type":[{"type":"print","value":"1041-4347"},{"type":"electronic","value":"1558-2191"},{"type":"electronic","value":"2326-3865"}],"subject":[],"published":{"date-parts":[[2023,9,1]]}}}