{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,17]],"date-time":"2025-10-17T14:02:12Z","timestamp":1760709732226},"reference-count":58,"publisher":"Oxford University Press (OUP)","issue":"3","license":[{"start":{"date-parts":[[2018,11,3]],"date-time":"2018-11-03T00:00:00Z","timestamp":1541203200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/academic.oup.com\/journals\/pages\/open_access\/funder_policies\/chorus\/standard_publication_model"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,3,1]]},"DOI":"10.1093\/comjnl\/bxy113","type":"journal-article","created":{"date-parts":[[2018,10,12]],"date-time":"2018-10-12T19:12:57Z","timestamp":1539371577000},"page":"461-480","source":"Crossref","is-referenced-by-count":7,"title":["A Conceptual Approach for Supporting Traffic Data Wrangling Tasks"],"prefix":"10.1093","volume":"62","author":[{"given":"Sandra","family":"Sampaio","sequence":"first","affiliation":[{"name":"Information Management Group, School of Computer Science, University of Manchester, Manchester, UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mashael","family":"Aljubairah","sequence":"additional","affiliation":[{"name":"Information Management Group, School of Computer Science, University of Manchester, Manchester, UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hapsoro Adi","family":"Permana","sequence":"additional","affiliation":[{"name":"Information Management Group, School of Computer Science, University of Manchester, Manchester, UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Pedro","family":"Sampaio","sequence":"additional","affiliation":[{"name":"Alliance Manchester Business School, University of Manchester, Manchester, UK"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"286","published-online":{"date-parts":[[2018,11,3]]},"reference":[{"key":"key\n\t\t\t\t2019030411255518200_bxy113C1","author":"Lopes","year":"2010"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C2","first-page":"94","volume-title":"Knowledge Discovery from Sensor Data","author":"Hutchins","year":"2008"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C3","doi-asserted-by":"crossref","first-page":"86","DOI":"10.1145\/2611567","article-title":"Big data and its technical challenges","volume":"57","author":"Jagadish","year":"2014","journal-title":"Commun. ACM"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C4","author":"Furche","year":"2016"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C5","author":"Terrizzano","year":"2015"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C6","doi-asserted-by":"crossref","first-page":"389","DOI":"10.1007\/s00778-007-0044-3","article-title":"Service oriented architectures: approaches, technologies and research issues","volume":"16","author":"Papazoglou","year":"2007","journal-title":"The VLDB Journal"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C7","volume-title":"Business Process Management\u2014Concepts, Languages, Architectures","author":"Weske","year":"2007"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C8","doi-asserted-by":"crossref","first-page":"18","DOI":"10.1145\/2694428.2694432","article-title":"Towards total traffic awareness","volume":"43","author":"Guo","year":"2014","journal-title":"SIGMOD Record"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C9","first-page":"1067","volume-title":"Concurr. Comp. Pract. Exp.","author":"Oinn","year":"2006"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C10","volume-title":"Foundations of Databases: The Logical Level","author":"Abiteboul","year":"1995","edition":"1st edn"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C11","doi-asserted-by":"crossref","DOI":"10.1002\/9781119183686","volume-title":"Data Science and Big Data Analytics: Discovering, Analyzing, Visualizing and Presenting Data","author":"Services","year":"2015"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C12","author":"Kandel","year":"2011"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C13","author":"Tye Rattenbury","year":"2016"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C14","author":"Endel","year":"2015"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C15","first-page":"3","article-title":"Data cleaning: problems and current approaches","volume":"23","author":"Rahm","year":"2000","journal-title":"IEEE Data Eng. Bull."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C16","volume-title":"Domain-Specific Languages Addison-Wesley Signature Series","author":"Fowler","year":"2011"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C17","author":"Trifacta","year":"2017"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C18","author":"OpenRefine-Google","year":"2017"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C19","volume-title":"Compilers: Principles, Techniques, and Tools","author":"Aho","year":"2006","edition":"2nd edn"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C20","volume-title":"Computers and Intractability: A Guide to the Theory of NP-Completeness","author":"Garey","year":"1990"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C21","doi-asserted-by":"crossref","first-page":"323","DOI":"10.1145\/27633.27634","article-title":"A comparative analysis of methodologies for database schema integration","volume":"18","author":"Batini","year":"1986","journal-title":"ACM Comput. Surv."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C22","author":"Aristaran","year":"2016"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C23","author":"Github","year":"2018"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C24","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3076253","article-title":"Data science: a comprehensive overview","volume":"50","author":"Cao","year":"2017","journal-title":"ACM Comput. Surv."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C25","author":"Meehan","year":"2017"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C26","doi-asserted-by":"crossref","first-page":"557","DOI":"10.1007\/s00778-015-0389-y","article-title":"Profiling relational data: a survey","volume":"24","author":"Abedjan","year":"2015","journal-title":"VLDB J."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C27","author":"Larsson","year":"2013"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C28","author":"Mike Tuchen","year":"2005"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C29","author":"Ihaka","year":"1993"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C30","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-84996-095-3","volume-title":"Introduction to Databases: From Biological to Spatio-Temporal","author":"Revesz","year":"2010","edition":"1st edn"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C31","doi-asserted-by":"crossref","first-page":"18","DOI":"10.1145\/2694428.2694432","article-title":"Towards total traffic awareness","volume":"43","author":"Guo","year":"2014","journal-title":"ACM SIGMOD Record"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C32","doi-asserted-by":"crossref","DOI":"10.1145\/1206049.1206056","article-title":"Spatial join techniques","volume":"32","author":"Jacox","year":"2007","journal-title":"ACM Trans. Database Syst."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C33","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4614-6396-2","volume-title":"Outlier Analysis","author":"Aggarwal","year":"2013"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C34","author":"Guarino","year":"1998"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C35","doi-asserted-by":"crossref","first-page":"489","DOI":"10.1016\/0306-4379(93)90004-K","article-title":"Formal definition of a conceptual language for the description and manipulation of information models","volume":"18","author":"ter Hofstede","year":"1993","journal-title":"Inf. Syst."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C36","volume-title":"Principles of Compiler Design","author":"Aho","year":"1977"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C37","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1002\/spe.2374","article-title":"The anatomy of big data computing","volume":"46","author":"Kune","year":"2016","journal-title":"Softw. Pract. Exp."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C38","volume-title":"Structure and Interpretation of Computer Programs","author":"Abelson","year":"1996","edition":"2nd edn"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C39","doi-asserted-by":"crossref","first-page":"265","DOI":"10.1177\/0023830913484897","article-title":"Three design principles of language: the search for parsimony in redundancy","volume":"56","author":"Beekhuizen","year":"2013","journal-title":"Lang. Speech"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C40","doi-asserted-by":"crossref","first-page":"377","DOI":"10.1145\/362384.362685","article-title":"A relational model of data for large shared data banks","volume":"13","author":"Codd","year":"1970","journal-title":"Commun. ACM"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C41","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/S0169-023X(00)00020-3","article-title":"Query processing in doql: a deductive database language for the odmg model","volume":"35","author":"Sampaio","year":"2000","journal-title":"Data Knowl. Eng."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C42","doi-asserted-by":"crossref","first-page":"8304","DOI":"10.1016\/j.eswa.2015.06.050","article-title":"Dq2s\u2014a framework for data quality-aware information management","volume":"42","author":"Mendes Sampaio","year":"2015","journal-title":"Expert Syst. Appl."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C43","doi-asserted-by":"crossref","first-page":"63","DOI":"10.1002\/cpe.907","article-title":"Measuring and modelling the performance of a parallel odmg compliant object database server","volume":"18","author":"Sampaio","year":"2006","journal-title":"Concurr. Comp. Pract. Exp."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C44","author":"Hasan","year":"1993"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C45","doi-asserted-by":"crossref","first-page":"427","DOI":"10.1002\/(SICI)1097-024X(199604)26:4<427::AID-SPE20>3.0.CO;2-H","article-title":"Iterators, schedulers, and distributed-memory parallelism","volume":"26","author":"Graefe","year":"1996","journal-title":"Softw. Pract. Exp."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C46","doi-asserted-by":"crossref","first-page":"111","DOI":"10.1145\/356924.356928","article-title":"Query optimization in database systems","volume":"16","author":"Jarke","year":"1984","journal-title":"ACM Comput. Surv."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C47","author":"Raman","year":"2001"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C48","author":"Lakshmanan","year":"1996"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C49","author":"Lee","year":"1999"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C50","author":"Savinov","year":"2017"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C51","doi-asserted-by":"crossref","first-page":"502","DOI":"10.4018\/978-1-4666-5202-6.ch045","volume-title":"Encyclopedia of Business Analytics and Optimization","author":"Savinov","year":"2014"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C52","author":"Konstantinou","year":"2017"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C53","volume-title":"Logic Programming and Databases","author":"Ceri","year":"2012","edition":"1st edn"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C54","author":"Dijkstra","year":"1982"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C55","doi-asserted-by":"crossref","first-page":"1121","DOI":"10.1109\/TVCG.2009.174","article-title":"Protovis: a graphical toolkit for visualization","volume":"15","author":"Bostock","year":"2009","journal-title":"IEEE Trans. Vis. Comput. Graph."},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C56","author":"Apache","year":"2014"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C57","author":"Sehgal","year":"2006"},{"key":"key\n\t\t\t\t2019030411255518200_bxy113C58","doi-asserted-by":"crossref","first-page":"38","DOI":"10.2307\/2309088","article-title":"The cosine-haversine formula","volume":"64","author":"Robusto","year":"1957","journal-title":"Am. Math. Mon."}],"container-title":["The Computer Journal"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/academic.oup.com\/comjnl\/article-pdf\/62\/3\/461\/28009363\/bxy113.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,26]],"date-time":"2019-10-26T15:08:58Z","timestamp":1572102538000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/comjnl\/article\/62\/3\/461\/5158248"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,11,3]]},"references-count":58,"journal-issue":{"issue":"3","published-online":{"date-parts":[[2018,11,3]]},"published-print":{"date-parts":[[2019,3,1]]}},"URL":"https:\/\/doi.org\/10.1093\/comjnl\/bxy113","relation":{},"ISSN":["0010-4620","1460-2067"],"issn-type":[{"value":"0010-4620","type":"print"},{"value":"1460-2067","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2019,3]]},"published":{"date-parts":[[2018,11,3]]}}}