{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,8]],"date-time":"2024-09-08T10:35:38Z","timestamp":1725791738780},"publisher-location":"Berlin, Heidelberg","reference-count":25,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642549021"},{"type":"electronic","value":"9783642549038"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-642-54903-8_33","type":"book-chapter","created":{"date-parts":[[2014,4,18]],"date-time":"2014-04-18T14:47:24Z","timestamp":1397832444000},"page":"392-403","source":"Crossref","is-referenced-by-count":0,"title":["How Document Properties Affect Document Relatedness Measures"],"prefix":"10.1007","author":[{"given":"Jessica","family":"Perrie","sequence":"first","affiliation":[]},{"given":"Aminul","family":"Islam","sequence":"additional","affiliation":[]},{"given":"Evangelos","family":"Milios","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"33_CR1","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"312","DOI":"10.1007\/978-3-642-30353-1_29","volume-title":"Advances in Artificial Intelligence","author":"A. Islam","year":"2012","unstructured":"Islam, A., Milios, E., Ke\u0161elj, V.: Text similarity using google tri-grams. In: Kosseim, L., Inkpen, D. (eds.) Canadian AI 2012. LNCS, vol.\u00a07310, pp. 312\u2013317. Springer, Heidelberg (2012)"},{"issue":"5","key":"33_CR2","doi-asserted-by":"publisher","first-page":"556","DOI":"10.1016\/j.jbi.2005.12.004","volume":"39","author":"T. Bickmore","year":"2006","unstructured":"Bickmore, T., Giorgino, T.: Health dialog systems for patients and consumers. Journal of Biomedical Informatics\u00a039(5), 556\u2013571 (2006)","journal-title":"Journal of Biomedical Informatics"},{"key":"33_CR3","unstructured":"Liu, T., Liu, S., Chen, Z., Ma, W.Y.: An evaluation on feature selection for text clustering. In: Fawcett, T., Mishra, N. (eds.) Proc. 20th International Conference on Machine Learning (ICML 2003), pp. 488\u2013495. AAAI Press (August 2003)"},{"key":"33_CR4","doi-asserted-by":"crossref","first-page":"457","DOI":"10.1613\/jair.1523","volume":"22","author":"G. Erkan","year":"2004","unstructured":"Erkan, G., Radev, D.: Lexrank: Graph-based lexical centrality as salience in text summarization. Journal of Artificial Intelligence Research\u00a022, 457\u2013479 (2004)","journal-title":"Journal of Artificial Intelligence Research"},{"issue":"1","key":"33_CR5","first-page":"97","volume":"24","author":"H. Schutze","year":"1998","unstructured":"Schutze, H.: Automatic word sense discrimination. Computational Linguistics\u00a024(1), 97\u2013124 (1998)","journal-title":"Computational Linguistics"},{"key":"33_CR6","unstructured":"Wagstaff, K.L.: Chapter 1: Introduction: 1.2 Supervised Learning: Disadvantages of supervised learning (April 2007), \n                    \n                      http:\/\/www.wkiri.com\/research\/papers\/wagstaff-diss-1.ps\n                    \n                    \n                   (last accessed August 13, 2013)"},{"key":"33_CR7","unstructured":"Liu, Q., Wu, Y.: Supervised Learning (Janurary 2011), \n                    \n                      http:\/\/www.fxpal.com\/publications\/FXPAL-PR-11-626.pdf\n                    \n                    \n                   (last accessed August 13, 2013)"},{"issue":"2","key":"33_CR8","first-page":"34","volume":"2","author":"R. Sathy","year":"2013","unstructured":"Sathy, R., Abraham, A.: Comparison of Supervised and Unsupervised Learning Algorithms for Pattern Classification. International Journal of Advanced Research in Artificial Intelligence\u00a02(2), 34\u201338 (2013)","journal-title":"International Journal of Advanced Research in Artificial Intelligence"},{"key":"33_CR9","unstructured":"Islam, A., Milios, E., Ke\u0161elj, V.: Comparing Word Relatedness Measures Based on Google n-grams. In: International Conference on Computational Linguistics, pp. 495\u2013506 (December 2012)"},{"key":"33_CR10","unstructured":"Lee, M.D., Pincombe, B.M., Welsh, M.B.: An empirical evaluation of models of text document similarity. In: Proceedings of the XXVII Annual Conference of the Cognitive Science Society, Austin, Texas, USA, pp. 1254\u20131259. Cognitive Science Society (2005)"},{"key":"33_CR11","unstructured":"Thirumuruganathan, S.: A Detailed Introduction to K-Nearest Neighbor (KNN) Algorithm (May 2013), \n                    \n                      http:\/\/saravananthirumuruganathan.wordpress.com\/2010\/05\/17\/a-detailed-introduction-to-k-nearest-neighbor-knn-algorithm\/\n                    \n                    \n                   (last accessed July 30, 2013)"},{"key":"33_CR12","series-title":"IFIP","doi-asserted-by":"publisher","first-page":"169","DOI":"10.1007\/978-0-387-34747-9_18","volume-title":"Artificial Intelligence in Theory and Practice","author":"F. Colas","year":"2006","unstructured":"Colas, F., Brazdil, P.: Comparison of svm and some older classification algorithms in text classification tasks. In: Bramer, M. (ed.) Artificial Intelligence in Theory and Practice. IFIP, vol.\u00a0217, pp. 169\u2013178. Springer, Heidelberg (2006)"},{"issue":"11","key":"33_CR13","doi-asserted-by":"publisher","first-page":"613","DOI":"10.1145\/361219.361220","volume":"18","author":"G. Salton","year":"1975","unstructured":"Salton, G., Wong, A., Yang, C.S.: A vector space model for automatic indexing. Commun. ACM\u00a018(11), 613\u2013620 (1975)","journal-title":"Commun. ACM"},{"key":"33_CR14","first-page":"757","volume-title":"Proceedings of the 16th International Conference on World Wide Web, WWW 2007","author":"D. Bollegala","year":"2007","unstructured":"Bollegala, D., Matsuo, Y., Ishizuka, M.: Measuring semantic similarity between words using web search engines. In: Proceedings of the 16th International Conference on World Wide Web, WWW 2007, pp. 757\u2013766. ACM, New York (2007)"},{"key":"33_CR15","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"491","DOI":"10.1007\/3-540-44795-4_42","volume-title":"Machine Learning: ECML 2001","author":"P.D. Turney","year":"2001","unstructured":"Turney, P.D.: Mining the web for synonyms: PMI-IR versus LSA on TOEFL. In: Flach, P.A., De Raedt, L. (eds.) ECML 2001. LNCS (LNAI), vol.\u00a02167, pp. 491\u2013502. Springer, Heidelberg (2001)"},{"issue":"13","key":"33_CR16","doi-asserted-by":"publisher","first-page":"13","DOI":"10.5120\/11638-7118","volume":"68","author":"W.H. Gomaa","year":"2013","unstructured":"Gomaa, W.H., Fahmy, A.A.: A survey of text similarity approaches. International Journal of Computer Applications\u00a068(13), 13\u201318 (2013)","journal-title":"International Journal of Computer Applications"},{"key":"33_CR17","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"175","DOI":"10.1007\/978-3-540-70939-8_16","volume-title":"Computational Linguistics and Intelligent Text Processing","author":"M.. A. Islam","year":"2007","unstructured":"Islam, M. A., Inkpen, D.Z., Kiringa, I.: A generalized approach to word segmentation using\u00a0maximum length descending frequency and\u00a0entropy rate. In: Gelbukh, A. (ed.) CICLing 2007. LNCS, vol.\u00a04394, pp. 175\u2013185. Springer, Heidelberg (2007)"},{"key":"33_CR18","unstructured":"Oza, N.: SIAM 2007 Text Mining Competition dataset (September 2010), \n                    \n                      https:\/\/c3.nasa.gov\/dashlink\/resources\/138\/\n                    \n                    \n                   (last accessed May 30, 2013)"},{"key":"33_CR19","unstructured":"Berry, M.W.: Automating the Detection of Anomalies and Trends from Text (2007), \n                    \n                      http:\/\/citeseerx.ist.psu.edu\/viewdoc\/download?rep=rep1&type=pdf&doi=10.1.1.132.751\n                    \n                    \n                   (last accessed August 23, 2013)"},{"key":"33_CR20","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"463","DOI":"10.1007\/978-3-642-32115-3_55","volume-title":"Rough Sets and Current Trends in Computing","author":"R. Kiros","year":"2012","unstructured":"Kiros, R., Soto, A.J., Milios, E., Keselj, V.: Representation learning for sparse, high dimensional multi-label classification. In: Yao, J., Yang, Y., S\u0142owi\u0144ski, R., Greco, S., Li, H., Mitra, S., Polkowski, L. (eds.) RSCTC 2012. LNCS, vol.\u00a07413, pp. 463\u2013470. Springer, Heidelberg (2012)"},{"key":"33_CR21","doi-asserted-by":"crossref","unstructured":"Bliznakov, Z., Stavrianou, K., Pallikarakis, N.: Medical devices recalls analysis focusing on software failures during the last decade. In: Roa Romero, L.M. (ed.) XIII Mediterranean Conference on Medical and Biological Engineering and Computing 2013. IFMBE Proceedings, vol.\u00a041, pp. 1174\u20131177. Springer International Publishing (2014)","DOI":"10.1007\/978-3-319-00846-2_291"},{"key":"33_CR22","unstructured":"BHL consortium: About (June 2013), \n                    \n                      http:\/\/biodivlib.wikispaces.com\/About\n                    \n                    \n                   (last accessed August 7, 2013)"},{"key":"33_CR23","unstructured":"BHL consortium: Download All File Types and Descriptions (August 2010), \n                    \n                      http:\/\/biodivlib.wikispaces.com\/Download+All+File+Types+and+Descriptions\n                    \n                    \n                   (last accessed August 13, 2013)"},{"key":"33_CR24","unstructured":"Lewis, D.D.: RCV1-v2\/LYRL2004: The LYRL2004 Distribution of the RCV1-v2 Text Categorization Test Collection (April 12 2004 Version) (April 2004), \n                    \n                      http:\/\/www.ai.mit.edu\/projects\/jmlr\/papers\/volume5\/lewis04a\/lyrl2004_rcv1v2_README.htm\n                    \n                    \n                   (last accessed August 12, 2013)"},{"issue":"6","key":"33_CR25","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1177\/875647939000600106","volume":"1","author":"R. Taylor","year":"1990","unstructured":"Taylor, R.: Interpretation of the correlation coefficient: A basic review. Journal of Diagnostic Medical Sonography\u00a01(6), 35\u201339 (1990)","journal-title":"Journal of Diagnostic Medical Sonography"}],"container-title":["Lecture Notes in Computer Science","Computational Linguistics and Intelligent Text Processing"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-54903-8_33","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,26]],"date-time":"2019-05-26T12:30:56Z","timestamp":1558873856000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-54903-8_33"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783642549021","9783642549038"],"references-count":25,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-54903-8_33","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2014]]}}}