{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T14:40:39Z","timestamp":1742913639057,"version":"3.40.3"},"publisher-location":"Cham","reference-count":30,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319639628"},{"type":"electronic","value":"9783319639628"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-319-63962-8_9-1","type":"book-chapter","created":{"date-parts":[[2018,8,25]],"date-time":"2018-08-25T07:03:28Z","timestamp":1535180608000},"page":"1-8","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Data Wrangling"],"prefix":"10.1007","author":[{"given":"Jeffrey","family":"Heer","sequence":"first","affiliation":[]},{"given":"Joseph M.","family":"Hellerstein","sequence":"additional","affiliation":[]},{"given":"Sean","family":"Kandel","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,2,5]]},"reference":[{"issue":"398","key":"9-1_CR1","first-page":"424","volume":"82","author":"DB Carr","year":"1987","unstructured":"Carr DB, Littlefield RJ, Nicholson W, Littlefield J (1987) Scatterplot matrix techniques for large N. J Am Stat Assoc 82(398):424\u2013436","journal-title":"J Am Stat Assoc"},{"key":"9-1_CR2","first-page":"833","volume-title":"Interactive generation of integrated schemas","author":"L Chiticariu","year":"2008","unstructured":"Chiticariu L, Kolaitis PG, Popa L (2008) Interactive generation of integrated schemas. In: ACM SIGMOD, pp 833\u2013846"},{"unstructured":"Codd EF (1971b) Further normalization of the data base relational model. In: Courant computer science symposia 6, Data base systems, (New York, May 24\u201325) pp 33\u201364, Prentice-Hall","key":"9-1_CR3"},{"key":"9-1_CR4","doi-asserted-by":"publisher","DOI":"10.1002\/0471448354","volume-title":"Exploratory data mining and data cleaning","author":"T Dasu","year":"2003","unstructured":"Dasu T, Johnson T (2003) Exploratory data mining and data cleaning. Wiley, New York"},{"key":"9-1_CR5","first-page":"240","volume-title":"Mining database structure; or, how to build a data quality browser","author":"T Dasu","year":"2002","unstructured":"Dasu T, Johnson T, Muthukrishnan S, Shkapenyuk V (2002) Mining database structure; or, how to build a data quality browser. In: ACM SIGMOD, pp 240\u2013251"},{"key":"9-1_CR6","volume-title":"Principles of data integration","author":"A Doan","year":"2012","unstructured":"Doan A, Halevy A, Ives Z (2012) Principles of data integration. Elsevier, Amsterdam"},{"key":"9-1_CR7","first-page":"100","volume-title":"The challenge of missing and uncertain data","author":"C Eaton","year":"2003","unstructured":"Eaton C, Plaisant C, Drizd T (2003) The challenge of missing and uncertain data. In: Proceedings of the IEEE visualization, p 100"},{"issue":"1","key":"9-1_CR8","first-page":"1","volume":"19","author":"AK Elmagarmid","year":"2007","unstructured":"Elmagarmid AK, Ipeirotis PG, Verykios VS (2007) Duplicate record detection: a survey. IEEE TKDE 19(1):1\u201316","journal-title":"IEEE TKDE"},{"doi-asserted-by":"crossref","unstructured":"Fisher K, Walker D (2011) The PADS project: an overview. In: International conference on database theory, Mar 2011","key":"9-1_CR9","DOI":"10.1145\/1938551.1938556"},{"key":"9-1_CR10","first-page":"590","volume-title":"AJAX: an extensible data cleaning tool","author":"H Galhardas","year":"2000","unstructured":"Galhardas H, Florescu D, Shasha D, Simon E (2000) AJAX: an extensible data cleaning tool. In: ACM SIGMOD, p 590"},{"key":"9-1_CR11","first-page":"317","volume-title":"Automating string processing in spreadsheets using input-output examples","author":"S Gulwani","year":"2011","unstructured":"Gulwani S (2011) Automating string processing in spreadsheets using input-output examples. In: ACM POPL, pp 317\u2013330"},{"doi-asserted-by":"crossref","unstructured":"Guo PJ, Kandel S, Hellerstein J, Heer J (2011) Proactive wrangling: mixed-initiative end-user programming of data transformation scripts. In: ACM user interface software & technology (UIST)","key":"9-1_CR12","DOI":"10.1145\/2047196.2047205"},{"key":"9-1_CR13","doi-asserted-by":"publisher","DOI":"10.1145\/1993498.1993536","volume-title":"Spreadsheet table transformations from examples","author":"W Harris","year":"2011","unstructured":"Harris W, Gulwani S (2011) Spreadsheet table transformations from examples. In: ACM PLDI"},{"key":"9-1_CR14","volume-title":"Predictive interaction for data transformation","author":"J Heer","year":"2015","unstructured":"Heer J, Hellerstein JM, Kandel S (2015) Predictive interaction for data transformation. In: CIDR"},{"key":"9-1_CR15","volume-title":"Quantitative data cleaning for large databases","author":"JM Hellerstein","year":"2008","unstructured":"Hellerstein JM (2008) Quantitative data cleaning for large databases. White Paper, United Nations Economic Commission for Europe"},{"issue":"2","key":"9-1_CR16","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1023\/B:AIRE.0000045502.10941.a9","volume":"22","author":"V Hodge","year":"2004","unstructured":"Hodge V, Austin J (2004) A survey of outlier detection methodologies. Artif Intell Rev 22(2):85\u2013126","journal-title":"Artif Intell Rev"},{"key":"9-1_CR17","first-page":"159","volume-title":"Principles of mixed-initiative user interfaces","author":"E Horvitz","year":"1999","unstructured":"Horvitz E (1999) Principles of mixed-initiative user interfaces. In: ACM CHI, pp 159\u2013166"},{"unstructured":"Huynh D, Mazzocchi S (2010) Google refine. \nhttp:\/\/code.google.com\/p\/google-refine\/","key":"9-1_CR18"},{"issue":"5","key":"9-1_CR19","first-page":"999","volume":"14","author":"H Kang","year":"2008","unstructured":"Kang H, Getoor L, Shneiderman B, Bilgic M, Licamele L (2008) Interactive entity resolution in relational data: a visual analytic tool and its evaluation. IEEE TVCG 14(5):999\u20131014","journal-title":"IEEE TVCG"},{"issue":"4","key":"9-1_CR20","doi-asserted-by":"publisher","first-page":"271","DOI":"10.1177\/1473871611415994","volume":"10","author":"S Kandel","year":"2011","unstructured":"Kandel S, Heer J, Plaisant C, Kennedy J, van Ham F, Riche NH, Weaver C, Lee B, Brodbeck D, Buono P (2011a) Research directions in data wrangling: visualizations and transformations for usable and credible data. Inf Vis J 10(4):271\u2013288","journal-title":"Inf Vis J"},{"doi-asserted-by":"crossref","unstructured":"Kandel S, Paepcke A, Hellerstein J, Heer J (2011b) Wrangler: interactive visual specification of data transformation scripts. In: ACM human factors in computing systems (CHI)","key":"9-1_CR21","DOI":"10.1145\/1978942.1979444"},{"doi-asserted-by":"crossref","unstructured":"Kandel S, Paepcke A, Hellerstein J, Heer J (2012a) Enterprise data analysis and visualization: an interview study. In: IEEE visual analytics science & technology (VAST)","key":"9-1_CR22","DOI":"10.1109\/TVCG.2012.219"},{"key":"9-1_CR23","doi-asserted-by":"publisher","DOI":"10.1145\/2254556.2254659","volume-title":"Profiler: integrated statistical analysis and visualization for data quality assessment","author":"S Kandel","year":"2012","unstructured":"Kandel S, Parikh R, Paepcke A, Hellerstein J, Heer J (2012b) Profiler: integrated statistical analysis and visualization for data quality assessment. In: Advanced visual interfaces"},{"issue":"4","key":"9-1_CR24","doi-asserted-by":"publisher","first-page":"476","DOI":"10.1145\/503099.503102","volume":"26","author":"LVS Lakshmanan","year":"2001","unstructured":"Lakshmanan LVS, Sadri F, Subramanian SN (2001) SchemaSQL: an extension to SQL for multidatabase interoperability. ACM Trans Database Syst 26(4): 476\u2013519","journal-title":"ACM Trans Database Syst"},{"key":"9-1_CR25","doi-asserted-by":"publisher","first-page":"334","DOI":"10.1007\/s007780100057","volume":"10","author":"E Rahm","year":"2001","unstructured":"Rahm E, Bernstein PA (2001) A survey of approaches to automatic schema matching. VLDB J 10:334\u2013350","journal-title":"VLDB J"},{"key":"9-1_CR26","first-page":"381","volume-title":"Potter\u2019s wheel: an interactive data cleaning system","author":"V Raman","year":"2001","unstructured":"Raman V, Hellerstein JM (2001) Potter\u2019s wheel: an interactive data cleaning system. In: VLDB, pp 381\u2013390"},{"key":"9-1_CR27","first-page":"431","volume-title":"Visualization of mappings between schemas","author":"GG Robertson","year":"2005","unstructured":"Robertson GG, Czerwinski MP, Churchill JE (2005) Visualization of mappings between schemas. In: ACM CHI, pp 431\u2013439"},{"key":"9-1_CR28","doi-asserted-by":"publisher","DOI":"10.1145\/775047.775087","volume-title":"Interactive deduplication using active learning","author":"S Sarawagi","year":"2002","unstructured":"Sarawagi S, Bhamidipaty A (2002) Interactive deduplication using active learning. In: ACM SIGKDD"},{"key":"9-1_CR29","volume-title":"Data curation at scale: the data tamer system","author":"M Stonebraker","year":"2013","unstructured":"Stonebraker M, Bruckner D, Ilyas IF, Beskales G, Cherniack M, Zdonik SB, Pagan A, Xu S (2013) Data curation at scale: the data tamer system. In: CIDR"},{"issue":"10","key":"9-1_CR30","doi-asserted-by":"publisher","first-page":"1","DOI":"10.18637\/jss.v059.i10","volume":"59","author":"H Wickham","year":"2014","unstructured":"Wickham H (2014) Tidy data. J Stat Softw 59(10):1\u201323","journal-title":"J Stat Softw"}],"container-title":["Encyclopedia of Big Data Technologies"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-63962-8_9-1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,10]],"date-time":"2019-05-10T03:08:46Z","timestamp":1557457726000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-63962-8_9-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783319639628","9783319639628"],"references-count":30,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-63962-8_9-1","relation":{},"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"5 February 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}