{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,19]],"date-time":"2025-09-19T09:25:04Z","timestamp":1758273904462},"reference-count":35,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2016,8,8]],"date-time":"2016-08-08T00:00:00Z","timestamp":1470614400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Lang Resources & Evaluation"],"published-print":{"date-parts":[[2017,9]]},"DOI":"10.1007\/s10579-016-9365-4","type":"journal-article","created":{"date-parts":[[2016,8,8]],"date-time":"2016-08-08T11:24:20Z","timestamp":1470655460000},"page":"805-832","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["MC4WEPS: a multilingual corpus for Web people search disambiguation"],"prefix":"10.1007","volume":"51","author":[{"given":"Soto","family":"Montalvo","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Raquel","family":"Mart\u00ednez","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Leonardo","family":"Campillos","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Agust\u00edn D.","family":"Delgado","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"V\u00edctor","family":"Fresno","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Felisa","family":"Verdejo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2016,8,8]]},"reference":[{"key":"9365_CR1","unstructured":"Artiles, J. (2009). 
Web people search. Ph.D. thesis, UNED."},{"key":"9365_CR2","unstructured":"Artiles, J., Borthwick, A., Gonzalo, J., Sekine, S., & Amig\u00f3, E. (2010). Weps-3 evaluation campaign: Overview of the web people search clustering and attribute extraction tasks. In Third Web people search evaluation forum (WePS-3)."},{"key":"9365_CR3","doi-asserted-by":"crossref","unstructured":"Artiles, J., Gonzalo, J., & Sekine, S. (2007). The semeval-2007 weps evaluation: Establishing a benchmark for the web people search task. In Proceedings of the fourth international workshop on semantic evaluations (SemEval-2007), pp. 64\u201369. ACL.","DOI":"10.3115\/1621474.1621486"},{"key":"9365_CR4","unstructured":"Artiles, J., Gonzalo, J., & Sekine, S. (2009). Weps 2 evaluation campaign: Overview of the web people search clustering task. In Proceedings of the 2nd Web people search evaluation workshop (WePS 2009)."},{"key":"9365_CR5","unstructured":"Bagga, A., & Baldwin, B. (1998). Entity-based cross-document coreferencing using the vector space model. In Proceedings of the 36th annual meeting of the association of computational linguistics and 17th international conference on computational linguistics (Vol.\u00a01, pp. 79\u201385)."},{"key":"9365_CR6","doi-asserted-by":"crossref","unstructured":"Bekkerman, R., & McCallum, A. (2005). Disambiguating web appearances of people in a social network. In Proceedings of the 14th international World Wide Web conference (WWW 2005) (pp. 463\u2013470).","DOI":"10.1145\/1060745.1060813"},{"key":"9365_CR7","doi-asserted-by":"crossref","unstructured":"Berendsen, R., Kovachev, B., Nastou, E. P., de Rijke, M., & Weerkamp, W. (2012). Result disambiguation in web people search. In Proceedings of the 34th European conference on advances in information retrieval (ECIR2012) (pp. 146\u2013157).","DOI":"10.1007\/978-3-642-28997-2_13"},{"key":"9365_CR8","doi-asserted-by":"crossref","unstructured":"Bhowmick, P. K., Mitra, P., & Basu, A. (2008). 
An agreement measure for determining inter-annotator reliability of human judgements on affective text. In Proceedings of the workshop on Human Judgements in Computational Linguistics (COLING 2008) (pp. 58\u201365).","DOI":"10.3115\/1611628.1611637"},{"key":"9365_CR9","doi-asserted-by":"crossref","first-page":"2690","DOI":"10.1016\/j.eswa.2011.08.125","volume":"39","author":"Y Chen","year":"2012","unstructured":"Chen, Y., Lee, S. Y. M., & Huang, C. R. (2012). A robust web personal name information extraction system. Expert Systems with Applications, 39, 2690\u20132699.","journal-title":"Expert Systems with Applications"},{"issue":"1","key":"9365_CR10","doi-asserted-by":"crossref","first-page":"37","DOI":"10.1177\/001316446002000104","volume":"20","author":"J Cohen","year":"1960","unstructured":"Cohen, J. (1960). A coefficient of agreement for nominal scales. Educational and Psychological Measurement, 20(1), 37\u201346.","journal-title":"Educational and Psychological Measurement"},{"key":"9365_CR11","first-page":"51","volume":"53","author":"AD Delgado","year":"2014","unstructured":"Delgado, A. D., Mart\u00ednez, R., Fresno, V., & Montalvo, S. (2014a). An unsupervised algorithm for person name disambiguation in the web. Procesamiento del Lenguaje Natural, 53, 51\u201358.","journal-title":"Procesamiento del Lenguaje Natural"},{"key":"9365_CR12","unstructured":"Delgado, A. D., Mart\u00ednez, R., Montalvo, S., & Fresno, V. (2014b). A data driven approach for person name disambiguation in web search results. In Proceedings of the 25th international conference on computational linguistics (COLING 2014) (pp. 301\u2013310)."},{"issue":"1","key":"9365_CR13","doi-asserted-by":"crossref","first-page":"95","DOI":"10.1162\/089120104773633402","volume":"30","author":"B Di","year":"2004","unstructured":"Di, B., & Glass, E. M. (2004). Squibs and discussions the kappa statistic: A second look. 
Computational Linguistics, 30(1), 95\u2013101.","journal-title":"Computational Linguistics"},{"key":"9365_CR14","volume-title":"Statistical methods for rates and proportions","author":"JL Fleiss","year":"1981","unstructured":"Fleiss, J. L. (1981). Statistical methods for rates and proportions (2nd ed.). New York: Wiley.","edition":"2"},{"key":"9365_CR15","doi-asserted-by":"crossref","first-page":"553","DOI":"10.1080\/01621459.1983.10478008","volume":"78","author":"EB Fowlkes","year":"1983","unstructured":"Fowlkes, E. B., & Mallows, C. L. (1983). A method for comparing two hierarchical clusterings. Journal of the American Statistical Association, 78, 553\u2013569.","journal-title":"Journal of the American Statistical Association"},{"key":"9365_CR16","unstructured":"Gruetze, T., Kasneci, G., Zuo, Z., & Naumann, F. (2014). Bootstrapped grouping of results to ambiguous person name queries. In Proceedings of the 30th international conference on data engineering workshops (ICDE) (pp. 56\u201361)."},{"issue":"2\u20133","key":"9365_CR17","doi-asserted-by":"crossref","first-page":"107","DOI":"10.1023\/A:1012801612483","volume":"17","author":"M Halkidi","year":"2001","unstructured":"Halkidi, M., Batistakis, Y., & Vazirgiannis, M. (2001). On clustering validation techniques. Journal of Intelligent Information Systems, 17(2\u20133), 107\u2013145.","journal-title":"Journal of Intelligent Information Systems"},{"key":"9365_CR18","first-page":"547","volume":"37","author":"P Jaccard","year":"1901","unstructured":"Jaccard, P. (1901). \u00c9tude comparative de la distribution florale dans une portion des alpes et des jura. Bulletin de la Soci\u00e9t\u00e9 Vaudoise des Sciences Naturelles, 37, 547\u2013579.","journal-title":"Bulletin de la Soci\u00e9t\u00e9 Vaudoise des Sciences Naturelles"},{"issue":"3","key":"9365_CR19","doi-asserted-by":"crossref","first-page":"333","DOI":"10.1162\/089120103322711569","volume":"29","author":"A Kilgarriff","year":"2003","unstructured":"Kilgarriff, A., & Grefenstette, G. 
(2003). Web as corpus: Introduction to the special issue. Computational Linguistics, 29(3), 333\u2013347.","journal-title":"Computational Linguistics"},{"key":"9365_CR20","doi-asserted-by":"crossref","first-page":"159","DOI":"10.2307\/2529310","volume":"33","author":"JR Landis","year":"1977","unstructured":"Landis, J. R., & Koch, G. G. (1977). The measurement of observer agreement for categorical data. Biometrics, 33, 159\u2013174.","journal-title":"Biometrics"},{"key":"9365_CR21","unstructured":"Liu, V., & Curran, J.R. (2006). Web text corpus for natural language processing. In Proceedings of the 11th conference of the European chapter of the association for computational linguistics (pp. 233\u2013240)."},{"key":"9365_CR22","unstructured":"Liu, Z., Lu, Q., & Xu, J. (2011). High performance clustering for web person name disambiguation using topic capturing. In International workshop on entity-oriented Search (EOS)."},{"key":"9365_CR23","unstructured":"Mann, G. S. (2006). Multi-document statistical fact extraction and fusion. Ph.D. thesis, Johns Hopkins University, Baltimore, MD, USA. AAI3213760"},{"key":"9365_CR24","volume-title":"Corpus-based language studies: An advanced resource book","author":"A McEnery","year":"2006","unstructured":"McEnery, A., Xiao, R., & Tono, Y. (2006). Corpus-based language studies: An advanced resource book. London: Routledge."},{"issue":"1","key":"9365_CR25","first-page":"1","volume":"37","author":"R Nuray-Turan","year":"2012","unstructured":"Nuray-Turan, R., Kalashnikov, D. V., & Mehrotra, S. (2012). Exploiting web querying for Web people search. Journal ACM Transactions on Database Systems, 37(1), 1\u201341.","journal-title":"Journal ACM Transactions on Database Systems"},{"key":"9365_CR26","unstructured":"Pedersen, T., Kulkarni, A., Angheluta, R., Kozareva, Z., & Solorio, T. (2006). An unsupervised language independent method of name discrimination using second order co-occurrence features. 
Computational linguistics and intelligent text processing (Vol. 3878, pp. 208\u2013222). Lecture Notes in Computer Science. Berlin, Heidelberg: Springer."},{"key":"9365_CR27","doi-asserted-by":"crossref","first-page":"846","DOI":"10.1080\/01621459.1971.10482356","volume":"66","author":"WM Rand","year":"1971","unstructured":"Rand, W. M. (1971). Objective criteria for the evaluation of clustering methods. Journal of the American Statistical Association, 66, 846\u2013850.","journal-title":"Journal of the American Statistical Association"},{"key":"9365_CR28","unstructured":"Rosell, M., Kann, V., & Litton, J.E. (2004). Comparing comparisons: Document clustering evaluation using two manual classifications. In Proceedings of the international conference on natural language processing (pp. 207\u2013216)."},{"key":"9365_CR29","doi-asserted-by":"crossref","unstructured":"Shen, D., Walker, T., Zheng, Z., Yang, Q., & Li, Y. (2008). Personal name classification in web queries. In Proceedings of the 2008 international conference on Web search and data mining (WSDM\u201908) (pp. 149\u2013158).","DOI":"10.1145\/1341531.1341553"},{"key":"9365_CR30","volume-title":"Nonparametric statistics for the behavioral sciences","author":"S Siegel","year":"1988","unstructured":"Siegel, S., & Castellan, N. J. (1988). Nonparametric statistics for the behavioral sciences (2nd ed.). New York: McGraw Hill.","edition":"2"},{"key":"9365_CR31","doi-asserted-by":"crossref","unstructured":"Vu, Q. M., Takasu, A., & Adachi, J. (2008). Name disambiguation boosted by latent topics from web directories. In Proceedings of the IEEE\/WIC\/ACM international conference on Web intelligence and intelligent agent technology (WI-IAT \u201908) (pp. 697\u2013703).","DOI":"10.1109\/WIIAT.2008.171"},{"key":"9365_CR32","doi-asserted-by":"crossref","unstructured":"Wang, X., Tang, J., Cheng, H., & Yu, P. S. (2011). Adana: Active name disambiguation. 
In Proceedings of the 2011 IEEE 11th international conference on data mining (ICDM\u201911) (pp. 794\u2013803).","DOI":"10.1109\/ICDM.2011.19"},{"key":"9365_CR33","volume-title":"The handbook of natural language processing, chap. corpus creation","author":"R Xiao","year":"2010","unstructured":"Xiao, R. (2010). The handbook of natural language processing, chap. corpus creation. Boca Raton: CRC Press."},{"key":"9365_CR34","doi-asserted-by":"crossref","unstructured":"Xu, J., Lu, Q., Li, M., & Li, W. (2015). Web person disambiguation using hierarchical co-reference model. In Proceedings of the 16th international conference CICLing 2015 (pp. 279\u2013291).","DOI":"10.1007\/978-3-319-18111-0_22"},{"key":"9365_CR35","doi-asserted-by":"crossref","unstructured":"Yoshida, M., Ikeda, M., Ono, S., Sato, I., & Nakagawa, H. (2010). Person name disambiguation by bootstrapping. In Proceedings of the 33rd international ACM SIGIR conference on research and development in information retrieval (SIGIR\u201910) (pp. 
10\u201317).","DOI":"10.1145\/1835449.1835454"}],"container-title":["Language Resources and Evaluation"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10579-016-9365-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-016-9365-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-016-9365-4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-016-9365-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,8,4]],"date-time":"2017-08-04T10:07:38Z","timestamp":1501841258000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10579-016-9365-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,8,8]]},"references-count":35,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2017,9]]}},"alternative-id":["9365"],"URL":"https:\/\/doi.org\/10.1007\/s10579-016-9365-4","relation":{},"ISSN":["1574-020X","1574-0218"],"issn-type":[{"value":"1574-020X","type":"print"},{"value":"1574-0218","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016,8,8]]}}}