{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,4]],"date-time":"2024-09-04T21:58:25Z","timestamp":1725487105394},"publisher-location":"Berlin, Heidelberg","reference-count":24,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540732549"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1007\/978-3-540-73255-6_13","type":"book-chapter","created":{"date-parts":[[2007,6,29]],"date-time":"2007-06-29T13:04:04Z","timestamp":1183122244000},"page":"139-155","source":"Crossref","is-referenced-by-count":2,"title":["Fast Approximate Duplicate Detection for 2D-NMR Spectra"],"prefix":"10.1007","author":[{"given":"Bj\u00f6rn","family":"Egert","sequence":"first","affiliation":[]},{"given":"Steffen","family":"Neumann","sequence":"additional","affiliation":[]},{"given":"Alexander","family":"Hinneburg","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"13_CR1","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1016\/0003-2670(95)00322-Q","volume":"316","author":"A. Tsipouras","year":"1995","unstructured":"Tsipouras, A., Ondeyka, J., Dufresne, C., et al.: Using similarity searches over databases of estimated c-13 nmr spectra for structure identification of natural products. Analytica Chimica Acta\u00a0316, 161\u2013171 (1995)","journal-title":"Analytica Chimica Acta"},{"key":"13_CR2","doi-asserted-by":"publisher","first-page":"125","DOI":"10.1016\/j.chemolab.2005.01.003","volume":"78","author":"A.S. Barros","year":"2005","unstructured":"Barros, A.S., Rutledge, D.N.: Segmented principal component transform-principal component analysis. Chemometrics & Intelligent Laboratory Systems\u00a078, 125\u2013137 (2005)","journal-title":"Chemometrics & Intelligent Laboratory Systems"},{"key":"13_CR3","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1145\/956750.956759","volume-title":"KDD \u201903: Proceedings of the ninth ACM SIGKDD international conference on Knowledge discovery and data mining","author":"M. Bilenko","year":"2003","unstructured":"Bilenko, M., Mooney, R.J.: Adaptive duplicate detection using learnable string similarity measures. In: KDD \u201903: Proceedings of the ninth ACM SIGKDD international conference on Knowledge discovery and data mining, pp. 39\u201348. ACM Press, New York (2003)"},{"key":"13_CR4","first-page":"1157","volume-title":"Selected papers from the sixth international conference on World Wide Web","author":"A.Z. Broder","year":"1997","unstructured":"Broder, A.Z., Glassman, S.C., Manasse, M.S., Zweig, G.: Syntactic clustering of the web. In: Selected papers from the sixth international conference on World Wide Web, pp. 1157\u20131166. Elsevier Science Publishers, Essex, UK (1997)"},{"issue":"2","key":"13_CR5","doi-asserted-by":"publisher","first-page":"171","DOI":"10.1145\/506309.506311","volume":"20","author":"A. Chowdhury","year":"2002","unstructured":"Chowdhury, A., Frieder, O., Grossman, D., McCabe, M.C.: Collection statistics for fast duplicate document detection. ACM Trans. Inf. Syst.\u00a020(2), 171\u2013191 (2002)","journal-title":"ACM Trans. Inf. Syst."},{"issue":"3","key":"13_CR6","doi-asserted-by":"publisher","first-page":"441","DOI":"10.1006\/jcss.1997.1534","volume":"55","author":"E. Cohen","year":"1997","unstructured":"Cohen, E.: Size-estimation framework with applications to transitive closure and reachability. J. Comput. Syst. Sci.\u00a055(3), 441\u2013453 (1997)","journal-title":"J. Comput. Syst. Sci."},{"key":"13_CR7","doi-asserted-by":"publisher","first-page":"189","DOI":"10.1145\/199404.199437","volume":"218","author":"J.D. Cohen","year":"1995","unstructured":"Cohen, J.D., Lin, M.C., Manocha, D., Ponamgi, M.K.: I-COLLIDE: An interactive and exact collision detection system for large-scale environments. Symposium on Interactive 3D Graphics\u00a0218, 189\u2013196 (1995)","journal-title":"Symposium on Interactive 3D Graphics"},{"key":"13_CR8","doi-asserted-by":"publisher","first-page":"443","DOI":"10.1145\/956863.956946","volume-title":"CIKM \u201903: Proceedings of the twelfth international conference on Information and knowledge management","author":"J.G. Conrad","year":"2003","unstructured":"Conrad, J.G., Guo, X.S., Schriber, C.P.: Online duplicate document detection: signature reliability in a dynamic retrieval environment. In: CIKM \u201903: Proceedings of the twelfth international conference on Information and knowledge management, pp. 443\u2013452. ACM Press, New York (2003)"},{"key":"13_CR9","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1145\/1142473.1142477","volume-title":"SIGMOD \u201906: Proceedings of the 2006 ACM SIGMOD international conference on Management of data","author":"F. Deng","year":"2006","unstructured":"Deng, F., Rafiei, D.: Approximately detecting duplicates for streaming data using stable bloom filters. In: SIGMOD \u201906: Proceedings of the 2006 ACM SIGMOD international conference on Management of data, pp. 25\u201336. ACM Press, New York (2006)"},{"key":"13_CR10","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1145\/375663.375689","volume-title":"SIGMOD \u201901: Proceedings of the 2001 ACM SIGMOD international conference on Management of data","author":"A. Gionis","year":"2001","unstructured":"Gionis, A., Gunopulos, D., Koudas, N.: Efficient and tunable similar set retrieval. In: SIGMOD \u201901: Proceedings of the 2001 ACM SIGMOD international conference on Management of data, pp. 247\u2013258. ACM Press, New York (2001)"},{"key":"13_CR11","first-page":"518","volume-title":"VLDB\u201999: Proceedings of the 25th International Conference on Very Large Data Bases","author":"A. Gionis","year":"1999","unstructured":"Gionis, A., Indyk, P., Motwani, R.: Similarity search in high dimensions via hashing. In: VLDB\u201999: Proceedings of the 25th International Conference on Very Large Data Bases, pp. 518\u2013529. Morgan Kaufmann Publishers, CA USA (1999)"},{"key":"13_CR12","doi-asserted-by":"publisher","first-page":"818","DOI":"10.1145\/1141277.1141465","volume-title":"SAC \u201906: Proceedings of the 2006 ACM symposium on Applied computing","author":"D. Gomes","year":"2006","unstructured":"Gomes, D., Santos, A.L., Silva, M.J.: Managing duplicates in a web archive. In: SAC \u201906: Proceedings of the 2006 ACM symposium on Applied computing, pp. 818\u2013825. ACM Press, New York, NY, USA (2006)"},{"key":"13_CR13","doi-asserted-by":"publisher","first-page":"284","DOI":"10.1145\/1148170.1148222","volume-title":"SIGIR \u201906: Proceedings of the 29th annual international ACM SIGIR conference on Research and development in information retrieval","author":"M. Henzinger","year":"2006","unstructured":"Henzinger, M.: Finding near-duplicate web pages: a large-scale evaluation of algorithms. In: SIGIR \u201906: Proceedings of the 29th annual international ACM SIGIR conference on Research and development in information retrieval, pp. 284\u2013291. ACM Press, New York (2006)"},{"issue":"1","key":"13_CR14","doi-asserted-by":"publisher","first-page":"9","DOI":"10.1023\/A:1009761603038","volume":"2","author":"M.A. Hernandez","year":"1998","unstructured":"Hernandez, M.A., Stolfo, S.J.: Real-world data is dirty: Data cleansing and the merge\/purge problem. Data. Mining and Knowledge Discovery\u00a02(1), 9\u201337 (1998)","journal-title":"Data Mining and Knowledge Discovery"},{"issue":"1","key":"13_CR15","doi-asserted-by":"crossref","first-page":"53","DOI":"10.1515\/jib-2007-53","volume":"4","author":"A. Hinneburg","year":"2007","unstructured":"Hinneburg, A., Egert, B., Porzel, A.: Duplicate detection of 2d-nmr spectra. Journal of Integrative Bioinformatics\u00a04(1), 53 (2007)","journal-title":"Journal of Integrative Bioinformatics"},{"key":"13_CR16","doi-asserted-by":"crossref","unstructured":"Indyk, P., Motwani, R.: Approximate nearest neighbor - towards removing the curse of dimensionality. In: Proceedings of the 30th Symposium on Theory of Computing, pp. 604\u2013613 (1998)","DOI":"10.1145\/276698.276876"},{"key":"13_CR17","doi-asserted-by":"publisher","first-page":"869","DOI":"10.1145\/1027527.1027729","volume-title":"MULTIMEDIA \u201904: Proceedings of the 12th annual ACM international conference on Multimedia","author":"Y. Ke","year":"2004","unstructured":"Ke, Y., Sukthankar, R., Huston, L.: An efficient parts-based near-duplicate and sub-image retrieval system. In: MULTIMEDIA \u201904: Proceedings of the 12th annual ACM international conference on Multimedia, pp. 869\u2013876. ACM Press, New York (2004)"},{"key":"13_CR18","doi-asserted-by":"publisher","first-page":"255","DOI":"10.1093\/jxb\/eri010","volume":"56","author":"P. Krishnan","year":"2005","unstructured":"Krishnan, P., Kruger, N.J., Ratcliffe, R.G.: Metabolite fingerprinting and profiling in plants using nmr. Journal of Experimental Botany\u00a056, 255\u2013265 (2005)","journal-title":"Journal of Experimental Botany"},{"key":"13_CR19","doi-asserted-by":"publisher","first-page":"173","DOI":"10.1016\/S0003-2670(00)80840-5","volume":"206","author":"M. Farkas","year":"1988","unstructured":"Farkas, M., Bendl, J., Welti, D.H., et al.: Similarity search for a h-1 nmr spectroscopic data base. Analytica Chimica Acta.\u00a0206, 173\u2013187 (1988)","journal-title":"Analytica Chimica Acta"},{"key":"13_CR20","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1145\/1060745.1060753","volume-title":"WWW \u201905: Proceedings of the 14th international conference on World Wide Web","author":"A. Metwally","year":"2005","unstructured":"Metwally, A., Agrawal, D., Abbadi, A.E.: Duplicate detection in click streams. In: WWW \u201905: Proceedings of the 14th international conference on World Wide Web, pp. 12\u201321. ACM Press, New York (2005)"},{"key":"13_CR21","doi-asserted-by":"publisher","first-page":"459","DOI":"10.1145\/1081870.1081923","volume-title":"KDD \u201905: Proceeding of the eleventh ACM SIGKDD international conference on Knowledge discovery in data mining","author":"G.N. Noren","year":"2005","unstructured":"Noren, G.N., Orre, R., Bate, A.: A hit-miss model for duplicate detection in the who drug safety database. In: KDD \u201905: Proceeding of the eleventh ACM SIGKDD international conference on Knowledge discovery in data mining, pp. 459\u2013468. ACM Press, New York (2005)"},{"key":"13_CR22","doi-asserted-by":"publisher","first-page":"1733","DOI":"10.1021\/ci0341363","volume":"43","author":"C. Steinbeck","year":"2003","unstructured":"Steinbeck, C., Krause, S., Kuhn, S.: Nmrshiftdb-constructing a free chemical information system with open-source components. J. chem. inf. & comp. sci.\u00a043, 1733\u20131739 (2003)","journal-title":"J. chem. inf. & comp. sci."},{"key":"13_CR23","doi-asserted-by":"crossref","first-page":"10","DOI":"10.1145\/1012453.1012456","volume-title":"IQIS \u201904: Proceedings of the 2004 international workshop on Information quality in information systems","author":"M. Weis","year":"2004","unstructured":"Weis, M., Naumann, F.: Detecting duplicate objects in xml documents. In: IQIS \u201904: Proceedings of the 2004 international workshop on Information quality in information systems, pp. 10\u201319. ACM Press, New York (2004)"},{"key":"13_CR24","doi-asserted-by":"publisher","first-page":"421","DOI":"10.1145\/1148170.1148243","volume-title":"SIGIR \u201906: Proceedings of the 29th annual international ACM SIGIR conference on Research and development in information retrieval","author":"H. Yang","year":"2006","unstructured":"Yang, H., Callan, J.: Near-duplicate detection by instance-level constrained clustering. In: SIGIR \u201906: Proceedings of the 29th annual international ACM SIGIR conference on Research and development in information retrieval, pp. 421\u2013428. ACM Press, New York (2006)"}],"container-title":["Lecture Notes in Computer Science","Data Integration in the Life Sciences"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-73255-6_13.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,12]],"date-time":"2023-05-12T15:10:24Z","timestamp":1683904224000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-73255-6_13"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"ISBN":["9783540732549"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-73255-6_13","relation":{},"subject":[]}}