{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T03:08:50Z","timestamp":1742958530894,"version":"3.40.3"},"publisher-location":"Berlin, Heidelberg","reference-count":41,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642356469"},{"type":"electronic","value":"9783642356476"}],"license":[{"start":{"date-parts":[[2013,1,1]],"date-time":"2013-01-01T00:00:00Z","timestamp":1356998400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2013,1,1]],"date-time":"2013-01-01T00:00:00Z","timestamp":1356998400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2013]]},"DOI":"10.1007\/978-3-642-35647-6_10","type":"book-chapter","created":{"date-parts":[[2013,1,11]],"date-time":"2013-01-11T06:28:44Z","timestamp":1357885724000},"page":"131-143","source":"Crossref","is-referenced-by-count":2,"title":["Author Disambiguation in the YADDA2 Software Platform"],"prefix":"10.1007","author":[{"given":"Piotr Jan","family":"Dendek","sequence":"first","affiliation":[]},{"given":"Mariusz","family":"Wojew\u00f3dzki","sequence":"additional","affiliation":[]},{"given":"\u0141ukasz","family":"Bolikowski","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"10_CR1","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1145\/1014052.1014058","volume-title":"Proceedings of the 2004 ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD 2004","author":"E. Agichtein","year":"2004","unstructured":"Agichtein, E., Ganti, V.: Mining reference tables for automatic text segmentation. In: Proceedings of the 2004 ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD 2004, p. 20. ACM Press, New York (2004), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=1014052.1014058"},{"key":"10_CR2","unstructured":"Aono, M., Seddiqui, M.H.: Scalability in ontology instance matching of large semantic knowledge base. In: AIKED 2010 Proceedings of the 9th WSEAS International Conference on Artificial Intelligence, Knowledge Engineering and Data Bases, pp. 378\u2013383 (2010)"},{"issue":"6","key":"10_CR3","doi-asserted-by":"crossref","first-page":"680","DOI":"10.5858\/2003-127-680-CMDS","volume":"127","author":"J.J. Berman","year":"2003","unstructured":"Berman, J.J.: Concept-Match Medical Data Scrubbing. Archives of Pathology & Laboratory Medicine\u00a0127(6), 680\u2013686 (2003)","journal-title":"Archives of Pathology & Laboratory Medicine"},{"key":"10_CR4","unstructured":"Bolikowski, L., Dendek, P.J.: Towards a Flexible Author Name Disambiguation Framework. In: Sojka, P., Bouche, T. (eds.) Towards a Digital Mathematics Library, pp. 27\u201337. Masaryk University Press (2011)"},{"key":"10_CR5","doi-asserted-by":"publisher","first-page":"175","DOI":"10.1145\/375663.375682","volume-title":"Proceedings of the 2001 ACM SIGMOD International Conference on Management of Data, SIGMOD 2001","author":"V. Borkar","year":"2001","unstructured":"Borkar, V., Deshmukh, K., Sarawagi, S.: Automatic segmentation of text into structured records. In: Proceedings of the 2001 ACM SIGMOD International Conference on Management of Data, SIGMOD 2001, pp. 175\u2013186. ACM Press, New York (2001), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=375663.375682"},{"key":"10_CR6","doi-asserted-by":"publisher","first-page":"475","DOI":"10.1145\/775047.775116","volume-title":"Proceedings of the Eighth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD 2002","author":"W.W. Cohen","year":"2002","unstructured":"Cohen, W.W., Richman, J.: Learning to match and cluster large high-dimensional data sets for data integration. In: Proceedings of the Eighth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD 2002, p. 475. ACM Press, New York (2002), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=775047.775116"},{"key":"10_CR7","unstructured":"Culotta, A., Kanani, P., Hall, R., Wick, M., McCallum, A.: Author Disambiguation using Error-driven Machine Learning with a Ranking Loss Function. In: Sixth International Workshop on Information Integration on the Web (2007)"},{"key":"10_CR8","unstructured":"Dai, A.M., Storkey, A.J.: Author Disambiguation: A Nonparametric Topic and Co-authorship Model. In: NIPS Workshop on Applications for Topic Models Text and Beyond, pp. 1\u20134 (2009)"},{"key":"10_CR9","doi-asserted-by":"crossref","unstructured":"Dendek, P.J., Bolikowski, L.: Evaluation of Features for Author Name Disambiguation Using Linear Support Vector Machines. In: Proceedings of the 10th IAPR International Workshop on Document Analysis Systems, pp. 440\u2013444 (2012)","DOI":"10.1109\/DAS.2012.36"},{"issue":"1","key":"10_CR10","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TKDE.2007.250581","volume":"19","author":"A. Elmagarmid","year":"2007","unstructured":"Elmagarmid, A., Ipeirotis, P., Verykios, V.: Duplicate Record Detection: A Survey. IEEE Transactions on Knowledge and Data Engineering\u00a019(1), 1\u201316 (2007), \n                      http:\/\/ieeexplore.ieee.org\/lpdocs\/epic03\/wrapper.htm?arnumber=4016511","journal-title":"IEEE Transactions on Knowledge and Data Engineering"},{"key":"10_CR11","doi-asserted-by":"publisher","first-page":"1183","DOI":"10.1080\/01621459.1969.10501049","volume":"64","author":"I.P. Fellegi","year":"1969","unstructured":"Fellegi, I.P., Sunter, A.B.: A Theory for Record Linkage. Journal of the American Statistical Association\u00a064, 1183\u20131210 (1969)","journal-title":"Journal of the American Statistical Association"},{"key":"10_CR12","doi-asserted-by":"crossref","unstructured":"Han, H., Giles, L., Zha, H., Li, C., Tsioutsiouliklis, K.: Two supervised learning approaches for name disambiguation in author citations. In: Proceedings of the 2004 Joint ACM\/IEEE Conference on Digital Libraries - JCDL 2004, p. 296 (2004), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=996350.996419","DOI":"10.1145\/996350.996419"},{"key":"10_CR13","doi-asserted-by":"publisher","first-page":"334","DOI":"10.1145\/1065385.1065462","volume-title":"JCDL 2005: Proceedings of the 5th ACM\/IEEE-CS Joint Conference on Digital Libraries","author":"H. Han","year":"2005","unstructured":"Han, H., Zha, H., Giles, C.L.: Name disambiguation in author citations using a K-way spectral clustering method. In: JCDL 2005: Proceedings of the 5th ACM\/IEEE-CS Joint Conference on Digital Libraries, pp. 334\u2013343. ACM Press, New York (2005)"},{"issue":"1","key":"10_CR14","doi-asserted-by":"publisher","first-page":"9","DOI":"10.1023\/A:1009761603038","volume":"2","author":"M.A. Hern\u00e1ndez","year":"1998","unstructured":"Hern\u00e1ndez, M.A., Stolfo, S.J.: Real-world Data is Dirty: Data Cleansing and The Merge\/Purge Problem. Data Mining and Knowledge Discovery\u00a02(1), 9\u201337 (1998)","journal-title":"Data Mining and Knowledge Discovery"},{"issue":"4","key":"10_CR15","first-page":"599","volume":"24","author":"K. Knight","year":"1998","unstructured":"Knight, K., Graehl, J.: Machine Transliteration. Computational Linguistics\u00a024(4), 599\u2013612 (1998)","journal-title":"Computational Linguistics"},{"issue":"4","key":"10_CR16","doi-asserted-by":"publisher","first-page":"377","DOI":"10.1145\/146370.146380","volume":"24","author":"K. Kukich","year":"1992","unstructured":"Kukich, K.: Technique for automatically correcting words in text. ACM Computing Surveys\u00a024(4), 377\u2013439 (1992), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=146370.146380","journal-title":"ACM Computing Surveys"},{"key":"10_CR17","unstructured":"Levin, F.H., Heuser, C.A.: Using Genetic Programming to Evaluate the Impact of Social Network Analysis in Author Name Disambiguation. In: Laender, A.H.F., Lakshmanan, L.V.S. (eds.) Proceedings of the 4th Alberto Mendelzon International Workshop on Foundations of Data Management Buenos Aires Argentina, Citeseer, May 17-20., vol.\u00a0619 (2010), \n                      http:\/\/citeseerx.ist.psu.edu\/viewdoc\/download?doi=10.1.1.173.5987&amp;rep=rep1&amp;type=pdf\n                    , \n                      http:\/\/ceur-ws.org\/Vol-619\/paper2.pdf"},{"key":"10_CR18","doi-asserted-by":"crossref","unstructured":"Manning, C.D., Raghavan P., Sch\u00fctze, H.: Introduction to Information Retrieval (2008), \n                      http:\/\/nlp.stanford.edu\/IR-book\/html\/htmledition","DOI":"10.1017\/CBO9780511809071"},{"key":"10_CR19","unstructured":"McCallum, A., Freitag, D.: Maximum entropy Markov models for information extraction and segmentation. In: Proceedings of the Seventeenth International Conference on Machine Learning (2000), \n                      http:\/\/courses.ischool.berkeley.edu\/i290-dm\/s11\/SECURE\/gidofalvi.pdf"},{"key":"10_CR20","doi-asserted-by":"crossref","unstructured":"McCallum, A., Nigam, K., Ungar, L.H.: Efficient clustering of high-dimensional data sets with application to reference matching. In: Proceedings of the 6th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD 2000, pp. 169\u2013178. ACM Press, New York (2000), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=347090.347123\n                    , \n                      http:\/\/doi.acm.org\/10.1145\/347090.347123\n                    , \n                      http:\/\/dl.acm.org\/citation.cfm?id=347123","DOI":"10.1145\/347090.347123"},{"key":"10_CR21","unstructured":"Monge, A., Elkan, C.: An Efficient Domain-Independent Algorithm for Detecting Approximately Duplicate Database Records. In: Proc. Second ACM SIGMOD Workshop Research Issues in Data Mining and Knowledge Discovery, pp. 23\u201329 (1997)"},{"issue":"1","key":"10_CR22","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1145\/375360.375365","volume":"33","author":"G. Navarro","year":"2001","unstructured":"Navarro, G.: A guided tour to approximate string matching. ACM Computing Surveys\u00a033(1), 31\u201388 (2001), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=375360.375365","journal-title":"ACM Computing Surveys"},{"key":"10_CR23","unstructured":"Polish Technical Journal Contents, \n                      http:\/\/baztech.icm.edu.pl\/"},{"key":"10_CR24","unstructured":"Bigdata Database Webpage, \n                      http:\/\/www.systap.com\/bigdata.htm"},{"key":"10_CR25","unstructured":"Large Triple Stores Description, \n                      http:\/\/www.w3.org\/wiki\/LargeTripleStores"},{"key":"10_CR26","unstructured":"Neo4j: The World\u2019s Leading Graph Database, \n                      http:\/\/www.w3.org\/wiki\/LargeTripleStores"},{"key":"10_CR27","unstructured":"Semame Database Webpage, \n                      http:\/\/www.openrdf.org\/"},{"key":"10_CR28","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/1579114.1579121","volume-title":"Proceedings of the 2nd International Conference on PErvsive Technologies Related to Assistive Environments - PETRA 2009","author":"K. Park","year":"2009","unstructured":"Park, K., Becker, E., Vinjumur, J.K., Le, Z., Makedon, F.: Human behavioral detection and data cleaning in assisted living environment using wireless sensor networks. In: Proceedings of the 2nd International Conference on PErvsive Technologies Related to Assistive Environments - PETRA 2009, pp. 1\u20138. ACM Press, New York (2009), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=1579114.1579121"},{"issue":"6","key":"10_CR29","first-page":"38","volume":"18","author":"L. Philips","year":"2000","unstructured":"Philips, L.: The double metaphone search algorithm. C\/C++ Users Journal\u00a018(6), 38\u201343 (2000)","journal-title":"C\/C++ Users Journal"},{"key":"10_CR30","doi-asserted-by":"crossref","unstructured":"Qian, Y., Hu, Y., Cui, J., Zheng, Q., Nie, Z.: Combining Machine Learning and Human Judgment in Author Disambiguation Framework. In: Proceedings of the 20th ACM International Conference on Information and Knowledge Management, pp. 1241\u20131246. ACM Press (2011), \n                      http:\/\/research.microsoft.com\/pubs\/154452\/CIKM_CameraReady.pdf","DOI":"10.1145\/2063576.2063756"},{"key":"10_CR31","unstructured":"Raman, V.: Potter\u2019s wheel: An interactive data cleaning system. In: International Conference on Very Large Data (2001), \n                      http:\/\/www.vldb.org\/conf\/2001\/P381.pdf"},{"issue":"5","key":"10_CR32","doi-asserted-by":"publisher","first-page":"522","DOI":"10.1109\/34.682181","volume":"20","author":"E. Ristad","year":"1998","unstructured":"Ristad, E., Yianilos, P.: Learning string-edit distance. IEEE Transactions on Pattern Analysis and Machine Intelligence\u00a020(5), 522\u2013532 (1998), \n                      http:\/\/ieeexplore.ieee.org\/lpdocs\/epic03\/wrapper.htm?arnumber=682181","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"10_CR33","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1145\/1015330.1015422","volume-title":"Twenty-first International Conference on Machine Learning, ICML 2004","author":"C. Sutton","year":"2004","unstructured":"Sutton, C., Rohanimanesh, K., McCallum, A.: Dynamic conditional random fields. In: Twenty-first International Conference on Machine Learning, ICML 2004, p. 99. ACM Press, New York (2004), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=1015330.1015422"},{"key":"10_CR34","doi-asserted-by":"crossref","unstructured":"Sylwestrzak, W., Rosiek, T., Bolikowski, L.: YADDA2 Assemble Your Own Digital Library Application from Lego Bricks. In: Proceedings of the 2012 ACM\/IEEE on Joint Conference on Digital Libraries (2012)","DOI":"10.1145\/2232817.2232920"},{"key":"10_CR35","doi-asserted-by":"publisher","first-page":"314","DOI":"10.1145\/1141753.1141826","volume-title":"Proceedings of the 6th ACM\/IEEE-CS Joint Conference on Digital Libraries - JCDL 2006","author":"Y.F. Tan","year":"2006","unstructured":"Tan, Y.F., Kan, M.Y., Lee, D.: Search engine driven author disambiguation. In: Proceedings of the 6th ACM\/IEEE-CS Joint Conference on Digital Libraries - JCDL 2006, p. 314. ACM Press, New York (2006), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=1141753.1141826"},{"issue":"8","key":"10_CR36","doi-asserted-by":"crossref","first-page":"607","DOI":"10.1016\/S0306-4379(01)00042-4","volume":"26","author":"S. Tejada","year":"2001","unstructured":"Tejada, S., Knoblock, C.A., Minton, S.: Learning object identification rules for information integration. Information Systems\u00a026(8), 607\u2013633 (2001), \n                      http:\/\/www.sciencedirect.com\/science\/article\/pii\/S0306437901000424\n                    , \n                      http:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0306437901000424","journal-title":"Information Systems"},{"issue":"3","key":"10_CR37","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/1552303.1552304","volume":"3","author":"V.I. Torvik","year":"2009","unstructured":"Torvik, V.I., Smalheiser, N.R.: Author name disambiguation in MEDLINE. ACM Transactions on Knowledge Discovery from Data\u00a03(3), 1\u201329 (2009), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=1552303.1552304","journal-title":"ACM Transactions on Knowledge Discovery from Data"},{"key":"10_CR38","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1145\/1012453.1012457","volume-title":"Proceedings of the 2004 International Workshop on Information Quality in Informational Systems, IQIS 2004","author":"V.S. Verykios","year":"2004","unstructured":"Verykios, V.S., Moustakides, G.V.: A generalized cost optimal decision model for record matching. In: Proceedings of the 2004 International Workshop on Information Quality in Informational Systems, IQIS 2004, p. 20. ACM Press, New York (2004), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=1012453.1012457"},{"issue":"1","key":"10_CR39","doi-asserted-by":"publisher","first-page":"28","DOI":"10.1007\/s00778-002-0072-y","volume":"12","author":"V. Verykios","year":"2003","unstructured":"Verykios, V., Moustakides, G., Elfeky, M.: A Bayesian decision model for cost optimal record matching. The VLDB Journal The International Journal on Very Large Data Bases\u00a012(1), 28\u201340 (2003), \n                      http:\/\/www.springerlink.com\/Index\/10.1007\/s00778-002-0072-y","journal-title":"The VLDB Journal The International Journal on Very Large Data Bases"},{"key":"10_CR40","first-page":"1","volume-title":"Proceedings of the 48th Annual Southeast Regional Conference on - ACM SE 2010","author":"C. Vicknair","year":"2010","unstructured":"Vicknair, C., Macias, M., Zhao, Z., Nan, X., Chen, Y., Wilkins, D.: A comparison of a graph database and a relational database. In: Proceedings of the 48th Annual Southeast Regional Conference on - ACM SE 2010, p. 1. ACM Press, New York (2010), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=1900008.1900067"},{"key":"10_CR41","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1145\/221270.221319","volume-title":"Proceedings of the Fourth International Conference on Information and Knowledge Management, CIKM 1995","author":"J. Widom","year":"1995","unstructured":"Widom, J.: Research problems in data warehousing. In: Proceedings of the Fourth International Conference on Information and Knowledge Management, CIKM 1995, pp. 25\u201330. ACM Press, New York (1995), \n                      http:\/\/portal.acm.org\/citation.cfm?doid=221270.221319"}],"container-title":["Studies in Computational Intelligence","Intelligent Tools for Building a Scientific Information Platform"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-35647-6_10","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,25]],"date-time":"2024-01-25T15:22:26Z","timestamp":1706196146000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-642-35647-6_10"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013]]},"ISBN":["9783642356469","9783642356476"],"references-count":41,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-35647-6_10","relation":{},"ISSN":["1860-949X","1860-9503"],"issn-type":[{"type":"print","value":"1860-949X"},{"type":"electronic","value":"1860-9503"}],"subject":[],"published":{"date-parts":[[2013]]}}}