{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T11:55:13Z","timestamp":1743076513080,"version":"3.40.3"},"publisher-location":"Berlin, Heidelberg","reference-count":24,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642200441"},{"type":"electronic","value":"9783642200458"}],"license":[{"start":{"date-parts":[[2011,1,1]],"date-time":"2011-01-01T00:00:00Z","timestamp":1293840000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2011,1,1]],"date-time":"2011-01-01T00:00:00Z","timestamp":1293840000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2011]]},"DOI":"10.1007\/978-3-642-20045-8_7","type":"book-chapter","created":{"date-parts":[[2011,7,26]],"date-time":"2011-07-26T09:58:46Z","timestamp":1311674326000},"page":"133-150","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Dirty Data Management in Cloud Database"],"prefix":"10.1007","author":[{"given":"Hongzhi","family":"Wang","sequence":"first","affiliation":[]},{"given":"Jianzhong","family":"Li","sequence":"additional","affiliation":[]},{"given":"Jinbao","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Hong","family":"Gao","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2011,5,17]]},"reference":[{"unstructured":"Eckerson, W.W.: Xml for analysis specification. Technical Report, The Data Warehousing Institute. http:\/\/www.tdwi.org\/research\/display.aspx?ID\u2009=\u20096064, 2002","key":"7_CR1"},{"issue":"3","key":"7_CR2","doi-asserted-by":"publisher","first-page":"136","DOI":"10.2307\/41166093","volume":"43","author":"A Raman","year":"2001","unstructured":"Raman, A., DeHoratius, N., Ton, Z.:\u00a0Execution: The missing link in retail operations. Calif. Manag. Rev. 43(3), 136\u2013152 (2001)","journal-title":"Calif. Manag. Rev."},{"issue":"4","key":"7_CR3","first-page":"3","volume":"23","author":"E Rahm","year":"2000","unstructured":"Rahm, E.,\u00a0Do, H.H.: Data cleaning: Problems and current approaches. IEEE Data Eng. Bull. 23(4), 3\u201313 (2000)","journal-title":"IEEE Data Eng. Bull."},{"doi-asserted-by":"crossref","unstructured":"Fuxman, A.,\u00a0 Miller, R.J.: First-order query rewriting for inconsistent databases. In: ICDT, pp.\u00a0337\u2013351 (2005)","key":"7_CR4","DOI":"10.1007\/978-3-540-30570-5_23"},{"doi-asserted-by":"crossref","unstructured":"Fuxman, A., Fazli, E.,\u00a0Miller, R.J.: Conquer: Efficient management of inconsistent databases. In: SIGMOD Conference, pp. 155\u2013166 (2005)","key":"7_CR5","DOI":"10.1145\/1066157.1066176"},{"doi-asserted-by":"crossref","unstructured":"Andritsos, P.,\u00a0Fuxman, A.,\u00a0Miller, R.J.: Clean answers over dirty databases: A probabilistic approach. In: ICDE, p.\u00a030 (2006)","key":"7_CR6","DOI":"10.1109\/ICDE.2006.35"},{"key":"7_CR7","volume-title":"Database system implementation","author":"H Garcia-Molina","year":"2000","unstructured":"Garcia-Molina, H.,\u00a0Ullman, J.D., Widom, J.: Database system implementation. Prentice-Hall, NJ (2000)"},{"unstructured":"Li, C.,\u00a0Wang, B.,\u00a0Yang, X.:\u00a0Vgram: Improving performance of approximate queries on string collections using variable-length grams. In: VLDB, pp. 303\u2013314 (2007)","key":"7_CR8"},{"key":"7_CR9","volume-title":"Modern information retrieval","author":"RA Baeza-Yates","year":"1999","unstructured":"Baeza-Yates, R.A., Ribeiro-Neto, B.A.: Modern information retrieval. ACM, NY (1999)"},{"key":"7_CR10","volume-title":"Introduction to algorithms","author":"TH Cormen","year":"2001","unstructured":"Cormen, T.H., Leiserson, C.E., Rivest, R.L., Stein, C.: Introduction to algorithms, 2nd edn. MIT, MA (2001)","edition":"2"},{"issue":"9","key":"7_CR11","doi-asserted-by":"publisher","first-page":"490","DOI":"10.1145\/367390.367400","volume":"3","author":"E Fredkin","year":"1960","unstructured":"Fredkin, E.:\u00a0Trie memory. Commun. ACM 3(9), 490\u2013499 (1960)","journal-title":"Commun. ACM"},{"issue":"1","key":"7_CR12","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1016\/j.cosrev.2007.05.001","volume":"1","author":"SE Schaeffer","year":"2007","unstructured":"Schaeffer, S.E.: Graph clustering. Comp. Sci. Rev. 1(1), 27\u201364 (2007)","journal-title":"Comp. Sci. Rev."},{"doi-asserted-by":"crossref","unstructured":"Sarawagi, S.\u00a0, Kirpal, A.:\u00a0Efficient set joins on similarity predicates. In: SIGMOD Conference, pp. 743\u2013754 (2004)","key":"7_CR13","DOI":"10.1145\/1007568.1007652"},{"doi-asserted-by":"crossref","unstructured":"Xiao, C.,\u00a0Wang, W.,\u00a0Lin, X.,\u00a0Yu, J.X.: Efficient similarity joins for near duplicate detection. In: WWW, pp. 131\u2013140 (2008)","key":"7_CR14","DOI":"10.1145\/1367497.1367516"},{"doi-asserted-by":"crossref","unstructured":"Ghemawat, S., Gobioff, H., Leung, S.-T.: The Google file system. In: SOSP 2003, pp. 29\u201343","key":"7_CR15","DOI":"10.1145\/1165389.945450"},{"doi-asserted-by":"crossref","unstructured":"Chang, F., Dean, J., Ghemawat, S., Hsieh, W.C., Wallach, D.A., Burrows, M., Chandra, T., Fikes, A., Gruber, R.E.: Bigtable: a distributed storage system for structured data. ACM Trans. Comput. Syst. 26(2) (2008)","key":"7_CR16","DOI":"10.1145\/1365815.1365816"},{"unstructured":"Apache Hadoop http:\/\/hadoop.apache.org\/","key":"7_CR17"},{"issue":"2","key":"7_CR18","first-page":"1277","volume":"1","author":"BF Cooper","year":"2008","unstructured":"Cooper, B.F., Ramakrishnan, R., Srivastava, U., Silberstein, A., Bohannon, P., Jacobsen, H.A.: PNUTS: Yahoo!\u2019s hosted data serving platform. PVLDB 1(2), 1277\u20131288 (2008)","journal-title":"PVLDB"},{"doi-asserted-by":"crossref","unstructured":"DeCandia, G., Hastorun, D., Jampani, M., Kakulapati, G., Lakshman, A., Pilchin, A., Sivasubramanian, S., Vosshall, P., Vogels,W.: Dynamo: Amazon\u2019s highly available key-value store. In: SIGOPS, pp. 205\u2013220 (2007)","key":"7_CR19","DOI":"10.1145\/1323293.1294281"},{"unstructured":"Weil, S.A., Brandt, S.A., Miller, E.L., Long, D.D.E.: Ceph: a scalable, high-performance distributed file system. In: SODI, pp. 307\u2013320 (2006)","key":"7_CR20"},{"key":"7_CR21","volume-title":"Sinfonia: A new paradigm for building scalable distributed systems","author":"MK Aguilera","year":"2007","unstructured":"Aguilera, M.K., Merchant, A.,\u00a0Shah, M.,\u00a0Veitch, A.,\u00a0Karamanolis, C.: Sinfonia: A new paradigm for building scalable distributed systems. In: SOSP 2007"},{"key":"7_CR22","volume-title":"Mapreduce: Simplified data processing on large clusters","author":"J Dean","year":"2004","unstructured":"Dean, J., Ghemawat, S.: Mapreduce: Simplified data processing on large clusters. In: OSDI\u00a02004"},{"doi-asserted-by":"crossref","unstructured":"Yang, H.-C., Dasdan, A.,\u00a0Hsiao, R.-L., Parker, D.S.: Map-reduce-merge: Simplified relational data processing on large clusters. In: SIGMOD, pp. 1029\u20131040 (2007)","key":"7_CR23","DOI":"10.1145\/1247480.1247602"},{"issue":"1","key":"7_CR24","first-page":"922","volume":"2","author":"A Abouzeid","year":"2009","unstructured":"Abouzeid, A.,\u00a0Bajda-Pawlikowski, K.,\u00a0Abadi, D.J., Rasin, A.,\u00a0Silberschatz, A.: Hadoopdb: An architectural hybrid of mapreduce and dbms technologies for analytical workloads. PVLDB 2(1), 922\u2013933 (2009)","journal-title":"PVLDB"}],"container-title":["Grid and Cloud Database Management"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-20045-8_7","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,4,17]],"date-time":"2023-04-17T05:03:41Z","timestamp":1681707821000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-642-20045-8_7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011]]},"ISBN":["9783642200441","9783642200458"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-20045-8_7","relation":{},"subject":[],"published":{"date-parts":[[2011]]},"assertion":[{"value":"17 May 2011","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}