{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T06:04:59Z","timestamp":1725516299893},"publisher-location":"Berlin, Heidelberg","reference-count":27,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540698272"},{"type":"electronic","value":"9783540698289"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1007\/978-3-540-69828-9_9","type":"book-chapter","created":{"date-parts":[[2008,8,12]],"date-time":"2008-08-12T16:07:43Z","timestamp":1218557263000},"page":"92-107","source":"Crossref","is-referenced-by-count":0,"title":["An Entity Resolution Framework for Deduplicating Proteins"],"prefix":"10.1007","author":[{"given":"Lucas","family":"Lochovsky","sequence":"first","affiliation":[]},{"given":"Thodoros","family":"Topaloglou","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"9_CR1","doi-asserted-by":"publisher","first-page":"1985","DOI":"10.1002\/pmic.200300721","volume":"4","author":"P.J. Kersey","year":"2004","unstructured":"Kersey, P.J., Duarte, J., Williams, A., Karavidopoulou, Y., Birney, E., Apweiler, R.: The International Protein Index: An integrated database for proteomics experiments. Proteomics\u00a04, 1985\u20131988 (2004)","journal-title":"Proteomics"},{"key":"9_CR2","doi-asserted-by":"crossref","unstructured":"Birkland, A., Yona, G.: BIOZON: a system for unification, management and analysis of heterogeneous biological data. BMC Bioinformatics\u00a07(70) (2006)","DOI":"10.1186\/1471-2105-7-70"},{"key":"9_CR3","volume-title":"Biochemistry","author":"J.M. Berg","year":"2006","unstructured":"Berg, J.M., Tymoczko, J.L., Stryer, L.: Biochemistry, 5th edn. W.H. Freeman, New York (2006)","edition":"5"},{"key":"9_CR4","doi-asserted-by":"crossref","first-page":"W298","DOI":"10.1093\/nar\/gkl128","volume":"34","author":"C. Prieto","year":"2006","unstructured":"Prieto, C., Rivas, J.D.L.: APID: Agile Protein Interaction DataAnalyzer. Nucleic Acids Research\u00a034, W298\u2013W302 (2006)","journal-title":"Nucleic Acids Research"},{"key":"9_CR5","unstructured":"National Center for Biotechnology Information (NCBI), http:\/\/www.ncbi.nlm.nih.gov"},{"key":"9_CR6","unstructured":"Hubbard, T., Andrews, D., Caccamo, M., Cameron, G., Chen, Y., Clamp, M., Clarke, L., Coates, G., Cox, T., Cunningham, F., Curwen, V., Cutts, T., Down, T., Durbin, R., Fernandez-Suarez, X.M., Gilbert, J., Hammond, M., Herrero, J., Hotz, H., Howe, K., Iyer, V., Jekosch, K., Kahari, A., Kasprzyk, A., Keefe, D., Keenan, S., Kokocinsci, F., London, D., Longden, I., McVicker, G., Melsopp, C., Meidl, P., Potter, S., Proctor, G., Rae, M., Rios, D., Schuster, M., Searle, S., Severin, J., Slater, G., Smedley, D., Smith, J., Spooner, W., Stabenau, A., Stalker, J., Storey, R., Trevanion, S., Ureta-Vidal, A., Vogel, J., White, S., Woodwark, C., Birney, E.: Ensembl 2005. Nucleic Acids Research\u00a033(Database issue), D447\u2013D453 (2005)"},{"key":"9_CR7","doi-asserted-by":"crossref","unstructured":"The UniProt Consortium. The Universal Protein Resource (UniProt). Nucleic Acids Research 35, 193\u2013197 (2007)","DOI":"10.1093\/nar\/gkl929"},{"issue":"1","key":"9_CR8","doi-asserted-by":"publisher","first-page":"248","DOI":"10.1093\/nar\/gkg056","volume":"31","author":"G.D. Bader","year":"2003","unstructured":"Bader, G.D., Betel, D., Hogue, C.V.W.: BIND: the Biomolecular Interaction Network Database. Nucleic Acids Research\u00a031(1), 248\u2013250 (2003)","journal-title":"Nucleic Acids Research"},{"issue":"1","key":"9_CR9","doi-asserted-by":"publisher","first-page":"242","DOI":"10.1093\/nar\/29.1.242","volume":"29","author":"G.D. Bader","year":"2001","unstructured":"Bader, G.D., Donaldson, I., Wolting, C., Ouellette, B.F., Pawson, T., Hogue, C.W.: BINDThe Biomolecular Interaction Network Database. Nucleic Acids Research\u00a029(1), 242\u2013245 (2001)","journal-title":"Nucleic Acids Research"},{"issue":"5","key":"9_CR10","doi-asserted-by":"publisher","first-page":"465","DOI":"10.1093\/bioinformatics\/16.5.465","volume":"16","author":"G.D. Bader","year":"2000","unstructured":"Bader, G.D., Hogue, C.V.W.: BINDa data specification for storing and describing biomolecular interactions, molecular complexes and pathways. Bioinformatics\u00a016(5), 465\u2013477 (2000)","journal-title":"Bioinformatics"},{"key":"9_CR11","doi-asserted-by":"publisher","first-page":"2363","DOI":"10.1101\/gr.1680803","volume":"13","author":"S. Peri","year":"2003","unstructured":"Peri, S., Navarro, J.D., Amanchy, R., Kristiansen, T.Z., Jonnalagadda, C.K., Surendranath, V., Niranjan, V., Muthusamy, B., Gandhi, T.K., Gronborg, M., Ibarrola, N., Deshpande, N., Shanker, K., Shivashankar, H.N., Rashmi, B.P., Ramya, M.A., Zhao, Z., Chandrika, K.N., Padma, N., Harsha, H.C., Yatish, A.J., Kavitha, M.P., Menezes, M., Choudhury, D.R., Suresh, S., Ghosh, N., Saravana, R., Chandran, S., Krishna, S., Joy, M., Anand, S.K., Madavan, V., Joseph, A., Wong, G.W., Schiemann, W.P., Constantinescu, S.N., Huang, L., Khosravi-Far, R., Steen, H., Tewari, M., Ghaffari, S., Blobe, G.C., Dang, C.V., Garcia, J.G., Pevsner, J., Jensen, O.N., Roepstorff, P., Deshpande, K.S., Chinnaiyan, A.M., Hamosh, A., Chakravarti, A., Pandey, A.: Development of human protein reference database as an initial platform for approaching systems biology in humans. Genome Research\u00a013, 2363\u20132371 (2003)","journal-title":"Genome Research"},{"key":"9_CR12","unstructured":"Mishra, G., Suresh, M., Kumaran, K., Kannabiran, N., Suresh, S., Bala, P., Shivkumar, K., Anuradha, N., Reddy, R., Raghavan, T.M., Menon, S., Hanumanthu, G., Gupta, M., Upendran, S., Gupta, S., Mahesh, M., Jacob, B., Matthew, P., Chatterjee, P., Arun, K.S., Sharma, S., Chandrika, K.N., Deshpande, N., Palvankar, K., Raghavnath, R., Krishnakanth, K., Karathia, H., Rekha, B., Rashmi, N.S., Vishnupriya, G., Kumar, H.G.M., Nagini, M., Kumar, G.S.S., Jose, R., Deepthi, P., Mohan, S.S., Gandhi, T.K.B., Harsha, H.C., Deshpande, K.S., Sarker, M., Prasad, T.S.K., Pandey, A.: Human Protein Reference Database - 2006 Update. Nucleic Acids Research\u00a034, D411\u2013D414 (2006)"},{"key":"9_CR13","doi-asserted-by":"crossref","unstructured":"Chatr-aryamontri, A., Ceol, A., Palazzi, L.M., Nardelli, G., Schneider, M.V., Castagnoli, L., Cesareni, G.: MINT: the Molecular INTeraction database. Nucleic Acids Research\u00a035(Database issue), D572\u2013D574 (2007)","DOI":"10.1093\/nar\/gkl950"},{"key":"9_CR14","unstructured":"Munich Information Center for Protein Sequences (MIPS), http:\/\/mips.gsf.de"},{"key":"9_CR15","doi-asserted-by":"crossref","first-page":"D561","DOI":"10.1093\/nar\/gkl958","volume":"35","author":"S. Kerrien","year":"2007","unstructured":"Kerrien, S., Alam-Faruque, Y., Aranda, B., Bancarz, I., Bridge, A., Derow, C., Dimmer, E., Feuermann, M., Friedrichsen, A., Huntley, R., Kohler, C., Khadake, J., Leroy, C., Liban, A., Lieftink, C., Montecchi-Palazzi, L., Orchard, S., Risse, J., Robbe, K., Roechert, B., Thorneycroft, D., Zhang, Y., Apweiler, R., Hermjakob, H.: IntAct Open Source Resource for Molecular Interaction Data. Nucleic Acids Research 35(Database issue), D561\u2013D565 (2007)","journal-title":"Nucleic Acids Research"},{"key":"9_CR16","doi-asserted-by":"crossref","first-page":"D452","DOI":"10.1093\/nar\/gkh052","volume":"32","author":"H. Hermjakob","year":"2004","unstructured":"Hermjakob, H., Montecchi-Palazzi, L., Lewington, C., Mudali, S., Kerrien, S., Orchard, S., Vingron, M., Roechert, B., Roepstorff, P., Valencia, A., Margalit, H., Armstrong, J., Bairoch, A., Cesareni, G., Sherman, D., Apweiler, R.: IntAct: an open source molecular interaction database. Nucleic Acids Research\u00a032(Database issue), D452\u2013D455 (2004)","journal-title":"Nucleic Acids Research"},{"issue":"Database issue","key":"9_CR17","doi-asserted-by":"publisher","first-page":"449","DOI":"10.1093\/nar\/gkh086","volume":"32","author":"L. Salwinski","year":"2004","unstructured":"Salwinski, L., Miller, C.S., Smith, A.J., Pettit, F.K., Bowie, J.U., Eisenberg, D.: The Database of Interacting Proteins: 2004 update. NAR\u00a032(Database issue), 449\u2013451 (2004)","journal-title":"NAR"},{"key":"9_CR18","doi-asserted-by":"publisher","first-page":"76","DOI":"10.1016\/j.cbpa.2003.12.004","volume":"8","author":"R. Apweiler","year":"2004","unstructured":"Apweiler, R., Bairoch, A., Wu, C.H.: Protein sequence databases. Current Opinion in Chemical Biology\u00a08, 76\u201380 (2004)","journal-title":"Current Opinion in Chemical Biology"},{"key":"9_CR19","unstructured":"INSDC: International Nucleotide Sequence Database Collaboration, http:\/\/www.insdc.org"},{"key":"9_CR20","doi-asserted-by":"publisher","first-page":"1971","DOI":"10.1101\/gr.206701","volume":"11","author":"R. Mrowka","year":"2001","unstructured":"Mrowka, R., Patzak, A., Herzel, H.: Is There a Bias in Proteome Research? Genome Research\u00a011, 1971\u20131973 (2001)","journal-title":"Genome Research"},{"key":"9_CR21","unstructured":"The Cancer Cell Map, http:\/\/www.cellmap.org"},{"key":"9_CR22","unstructured":"Lochovsky, L.: An Entity Resolution Framework for Deduplicating Proteins. MSc thesis. University of Toronto (2008)"},{"key":"9_CR23","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"124","DOI":"10.1007\/3-540-45876-X_10","volume-title":"Advances in Database Technology - EDBT 2002","author":"M.L. Lee","year":"2002","unstructured":"Lee, M.L., Ling, T.W., Low, W.L.: Designing Functional Dependencies for XML. In: Jensen, C.S., Jeffery, K.G., Pokorn\u00fd, J., \u0160altenis, S., Bertino, E., B\u00f6hm, K., Jarke, M. (eds.) EDBT 2002. LNCS, vol.\u00a02287, pp. 124\u2013141. Springer, Heidelberg (2002)"},{"key":"9_CR24","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1111\/j.1574-6968.1999.tb13575.x","volume":"174","author":"T.A. Tatusova","year":"1999","unstructured":"Tatusova, T.A., Madden, T.L.: Blast 2 sequences - a new tool for comparing protein and nucleotide sequences. FEMS Microbiol Lett.\u00a0174, 247\u2013250 (1999)","journal-title":"FEMS Microbiol Lett."},{"issue":"3","key":"9_CR25","doi-asserted-by":"publisher","first-page":"171","DOI":"10.1145\/363958.363994","volume":"7","author":"F.J. Damerau","year":"1964","unstructured":"Damerau, F.J.: A technique for computer detection and correction of spelling errors. Communications of the ACM\u00a07(3), 171\u2013176 (1964)","journal-title":"Communications of the ACM"},{"key":"9_CR26","first-page":"707","volume":"10","author":"V.I. Levenshtein","year":"1966","unstructured":"Levenshtein, V.I.: Binary codes capable of correcting deletions, insertions, and reversals. Soviet Physics Doklady\u00a010, 707 (1966)","journal-title":"Soviet Physics Doklady"},{"key":"9_CR27","volume-title":"Data Mining: Concepts and Techniques","author":"J. Han","year":"2001","unstructured":"Han, J., Kamber, M.: Data Mining: Concepts and Techniques. Morgan Kaufman, Burlington (2001)"}],"container-title":["Lecture Notes in Computer Science","Data Integration in the Life Sciences"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-69828-9_9.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,11,19]],"date-time":"2020-11-19T05:03:02Z","timestamp":1605762182000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-69828-9_9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"ISBN":["9783540698272","9783540698289"],"references-count":27,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-69828-9_9","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[]}}