{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,9]],"date-time":"2025-07-09T23:02:47Z","timestamp":1752102167921},"reference-count":51,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2008,9,10]],"date-time":"2008-09-10T00:00:00Z","timestamp":1221004800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Mach Learn"],"published-print":{"date-parts":[[2009,2]]},"DOI":"10.1007\/s10994-008-5082-6","type":"journal-article","created":{"date-parts":[[2008,9,9]],"date-time":"2008-09-09T14:58:15Z","timestamp":1220972295000},"page":"133-158","source":"Crossref","is-referenced-by-count":10,"title":["Matrix representations, linear transformations, and\u00a0kernels for disambiguation in natural language"],"prefix":"10.1007","volume":"74","author":[{"given":"Tapio","family":"Pahikkala","sequence":"first","affiliation":[]},{"given":"Sampo","family":"Pyysalo","sequence":"additional","affiliation":[]},{"given":"Jorma","family":"Boberg","sequence":"additional","affiliation":[]},{"given":"Jouni","family":"J\u00e4rvinen","sequence":"additional","affiliation":[]},{"given":"Tapio","family":"Salakoski","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2008,9,10]]},"reference":[{"key":"5082_CR1","doi-asserted-by":"crossref","unstructured":"Bentivogli, L., Forner, P., Magnini, B., & Pianta, E. (2004). Revising wordnet domains hierarchy: Semantics, coverage, and balancing. In G.\u00a0S\u00e9rasset, S.\u00a0Armstrong, C.\u00a0Boitet, A.\u00a0Popescu-Belis, & D.\u00a0Tufis (Eds.), COLING 2004 workshop on multilingual linguistic resources (pp.\u00a0101\u2013108), Geneva, Switzerland.","DOI":"10.3115\/1706238.1706254"},{"key":"5082_CR2","first-page":"1059","volume":"3","author":"N. Cancedda","year":"2003","unstructured":"Cancedda, N., Gaussier, E., Goutte, C., & Renders, J.-M. (2003). Word-sequence kernels. Journal of Machine Learning Research, 3, 1059\u20131082.","journal-title":"Journal of Machine Learning Research"},{"key":"5082_CR3","first-page":"89","volume-title":"Proceedings of CoNLL-2004","author":"X. Carreras","year":"2004","unstructured":"Carreras, X., & M\u00e0rques, L. (2004). Introduction to the conll-2004 shared task: semantic role labeling. In Proceedings of CoNLL-2004 (pp.\u00a089\u201397). Boston: Association for Computational Linguistics."},{"key":"5082_CR4","doi-asserted-by":"crossref","first-page":"152","DOI":"10.3115\/1706543.1706571","volume-title":"Proceedings of the ninth conference on computational natural language learning (CoNLL-2005)","author":"X. Carreras","year":"2005","unstructured":"Carreras, X., & M\u00e0rquez, L. (2005). Introduction to the CoNLL-2005 shared task: semantic role labeling. In Proceedings of the ninth conference on computational natural language learning (CoNLL-2005) (pp.\u00a0152\u2013164). Ann Arbor: Association for Computational Linguistics."},{"key":"5082_CR5","doi-asserted-by":"crossref","unstructured":"Collins, M., & Duffy, N. (2001). Convolution kernels for natural language.","DOI":"10.7551\/mitpress\/1120.003.0085"},{"key":"5082_CR6","volume-title":"Advances in neural information processing systems\u00a016","author":"C. Cortes","year":"2004","unstructured":"Cortes, C., & Mohri, M. (2004). Auc optimization vs. error rate minimization. In S. Thrun, L. Saul, & B.\u00a0Sch\u00f6lkopf (Eds.), Advances in neural information processing systems\u00a016. Cambridge: MIT Press."},{"issue":"2\u20133","key":"5082_CR7","doi-asserted-by":"crossref","first-page":"127","DOI":"10.1023\/A:1013625426931","volume":"18","author":"N. Cristianini","year":"2002","unstructured":"Cristianini, N., Shawe-Taylor, J., & Lodhi, H. (2002). Latent semantic kernels. Journal of Intelligent Information Systems, 18(2\u20133), 127\u2013152.","journal-title":"Journal of Intelligent Information Systems"},{"key":"5082_CR8","unstructured":"Cumby, C. M., & Roth, D. (2002). Learning with feature description logics. In Proceedings of the 12th international conference on inductive logic programming."},{"key":"5082_CR9","unstructured":"Cumby, C. M., & Roth, D. (2003a). Feature extraction languages for propositionalized relational learning. In Proceedings of the IJCAI\u201903 workshop on learning statistical models from relational data."},{"key":"5082_CR10","first-page":"107","volume-title":"Proceedings of the twentieth international conference on machine learning","author":"C. M. Cumby","year":"2003","unstructured":"Cumby, C. M., & Roth, D. (2003b). On kernel methods for relational learning. In T. Fawcett & N. Mishra (Eds.), Proceedings of the twentieth international conference on machine learning (pp.\u00a0107\u2013114). Menlo Park: AAAI Press."},{"issue":"6","key":"5082_CR11","doi-asserted-by":"crossref","first-page":"391","DOI":"10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9","volume":"41","author":"S. C. Deerwester","year":"1990","unstructured":"Deerwester, S. C., Dumais, S. T., Landauer, T. K., Furnas, G. W., & Harshman, R. A. (1990). Indexing by latent semantic analysis. Journal of the American Society of Information Science, 41(6), 391\u2013407.","journal-title":"Journal of the American Society of Information Science"},{"key":"5082_CR12","unstructured":"Fawcett, T. (2003). Roc graphs: notes and practical considerations for data mining researchers (Technical Report HPL-2003-4). HP Labs, Palo Alto, CA."},{"key":"5082_CR13","doi-asserted-by":"crossref","unstructured":"G\u00e4rtner, T., Flach, P. A., & Wrobel, S. (2003). On graph kernels: hardness results and efficient alternatives. In COLT (pp.\u00a0129\u2013143).","DOI":"10.1007\/978-3-540-45167-9_11"},{"issue":"3","key":"5082_CR14","doi-asserted-by":"crossref","first-page":"205","DOI":"10.1023\/B:MACH.0000039777.23772.30","volume":"57","author":"T. G\u00e4rtner","year":"2004","unstructured":"G\u00e4rtner, T., Lloyd, J. W., & Flach, P. A. (2004). Kernels and distances for structured data. Machine Learning, 57(3), 205\u2013232.","journal-title":"Machine Learning"},{"key":"5082_CR15","first-page":"605","volume":"5","author":"F. Ginter","year":"2004","unstructured":"Ginter, F., Boberg, J., J\u00e4rvinen, J., & Salakoski, T. (2004). New techniques for disambiguation in natural language and their application to biological text. Journal of Machine Learning Research, 5, 605\u2013621.","journal-title":"Journal of Machine Learning Research"},{"key":"5082_CR16","first-page":"403","volume-title":"Proceedings of the 43rd annual meeting of the association for computational linguistics (ACL\u201905)","author":"A. Gliozzo","year":"2005","unstructured":"Gliozzo, A., Giuliano, C., & Strapparava, C. (2005). Domain kernels for word sense disambiguation. In Proceedings of the 43rd annual meeting of the association for computational linguistics (ACL\u201905) (pp.\u00a0403\u2013410). Ann Arbor: Association for Computational Linguistics."},{"key":"5082_CR17","doi-asserted-by":"crossref","first-page":"107","DOI":"10.1023\/A:1007545901558","volume":"34","author":"A. R. Golding","year":"1999","unstructured":"Golding, A. R., & Roth, D. (1999). A winnow-based approach to context-sensitive spelling correction. Machine Learning, 34, 107\u2013130.","journal-title":"Machine Learning"},{"key":"5082_CR18","unstructured":"Haussler, D. (1999). Convolution kernels on discrete structures (Technical Report UCS-CRL-99-10). University of California at Santa Cruz."},{"key":"5082_CR19","series-title":"Lecture notes in computer science","doi-asserted-by":"crossref","first-page":"137","DOI":"10.1007\/BFb0026683","volume-title":"Proceedings of the tenth European conference on machine learning","author":"T. Joachims","year":"1998","unstructured":"Joachims, T. (1998). Text categorization with support vector machines: learning with many relevant features. In C. N\u00e9dellec & C. Rouveirol (Eds.), Lecture notes in computer science : Vol.\u00a01398. Proceedings of the tenth European conference on machine learning (pp. 137\u2013142), Chemnitz, Germany, 1998. Heidelberg: Springer."},{"key":"5082_CR20","series-title":"Kluwer international series in engineering and computer science","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4615-0907-3","volume-title":"Learning to classify text using support vector machines: methods, theory and algorithms","author":"T. Joachims","year":"2002","unstructured":"Joachims, T. (2002). Kluwer international series in engineering and computer science: Vol.\u00a0668. Learning to classify text using support vector machines: methods, theory and algorithms. Norwell: Kluwer Academic."},{"key":"5082_CR21","volume-title":"Speech and language processing: an introduction to natural language processing, computational linguistics, and speech recognition","author":"D. Jurafsky","year":"2000","unstructured":"Jurafsky, D., & Martin, J. H. (2000). Speech and language processing: an introduction to natural language processing, computational linguistics, and speech recognition. Upper Saddle River: Prentice Hall PTR."},{"key":"5082_CR22","first-page":"657","volume-title":"Advances in neural information processing systems\u00a015","author":"J. Kandola","year":"2003","unstructured":"Kandola, J., Shawe-Taylor, J., & Cristianini, N. (2003). Learning semantic similarity. In S. T. Becker & K.\u00a0Obermayer (Eds.), Advances in neural information processing systems\u00a015 (pp.\u00a0657\u2013664). Cambridge: MIT Press."},{"issue":"1\u20133","key":"5082_CR23","doi-asserted-by":"crossref","first-page":"423","DOI":"10.1023\/A:1012491419635","volume":"46","author":"E. Leopold","year":"2002","unstructured":"Leopold, E., & Kindermann, J. (2002). Text categorization with support vector machines. How to represent texts in input space? Machine Learning, 46(1\u20133), 423\u2013444.","journal-title":"Machine Learning"},{"key":"5082_CR24","first-page":"519","volume-title":"Proceedings of the eighteenth international joint conference on artificial intelligence","author":"C. X. Ling","year":"2003","unstructured":"Ling, C. X., Huang, J., & Zhang, H. (2003). Auc: a statistically consistent and more discriminating measure than accuracy. In G. Gottlob & T. Walsh (Eds.), Proceedings of the eighteenth international joint conference on artificial intelligence (pp.\u00a0519\u2013526). San Mateo: Morgan Kaufmann."},{"key":"5082_CR25","first-page":"419","volume":"2","author":"H. Lodhi","year":"2002","unstructured":"Lodhi, H., Saunders, C., Shawe-Taylor, J., Cristianini, N., & Watkins, C. (2002). Text classification using string kernels. Journal of Machine Learning Research, 2, 419\u2013444.","journal-title":"Journal of Machine Learning Research"},{"key":"5082_CR26","first-page":"1413","volume-title":"Second international conference on language resources and evaluation (LREC-2000)","author":"B. Magnini","year":"2000","unstructured":"Magnini, B., & Cavagli\u00e0, G. (2000). Integrating subject field codes into WordNet. In Second international conference on language resources and evaluation (LREC-2000) (pp.\u00a01413\u20131418). Athens: European Language Resources Association."},{"key":"5082_CR27","volume-title":"Linear structures","author":"J. R. Magnus","year":"1988","unstructured":"Magnus, J. R. (1988). Linear structures. London: Griffin."},{"key":"5082_CR28","doi-asserted-by":"crossref","DOI":"10.1137\/1.9780898719512","volume-title":"Matrix analysis and applied linear algebra","author":"C. D. Meyer","year":"2000","unstructured":"Meyer, C. D. (2000). Matrix analysis and applied linear algebra. Philadelphia: Society for Industrial and Applied Mathematics."},{"issue":"1","key":"5082_CR29","doi-asserted-by":"crossref","first-page":"157","DOI":"10.1186\/1471-2105-6-157","volume":"6","author":"T. Pahikkala","year":"2005","unstructured":"Pahikkala, T., Ginter, F., Boberg, J., J\u00e4rvinen, J., & Salakoski, T. (2005a). Contextual weighting for support vector machines in literature mining: an application to gene versus protein name disambiguation. BMC Bioinformatics, 6(1), 157.","journal-title":"BMC Bioinformatics"},{"key":"5082_CR30","first-page":"90","volume-title":"Proceedings of the international and interdisciplinary conference on adaptive knowledge representation and reasoning","author":"T. Pahikkala","year":"2005","unstructured":"Pahikkala, T., Pyysalo, S., Boberg, J., Myll\u00e4ri, A., & Salakoski, T. (2005b). Improving the performance of Bayesian and support vector classifiers in word sense disambiguation using positional information. In T. Honkela, V. K\u00f6n\u00f6nen, M. P\u00f6ll\u00e4, & O. Simula (Eds.), Proceedings of the international and interdisciplinary conference on adaptive knowledge representation and reasoning (pp.\u00a090\u201397). Espoo: Helsinki University of Technology."},{"key":"5082_CR31","first-page":"442","volume-title":"Proceedings of the eighteenth international Florida artificial intelligence research society conference","author":"T. Pahikkala","year":"2005","unstructured":"Pahikkala, T., Pyysalo, S., Ginter, F., Boberg, J., J\u00e4rvinen, J., & Salakoski, T. (2005c). Kernels incorporating word positional information in natural language disambiguation tasks. In I. Russell & Z. Markov (Eds.), Proceedings of the eighteenth international Florida artificial intelligence research society conference (pp. 442\u2013447), Clearwater Beach, FL. Menlo Park: AAAI Press."},{"key":"5082_CR32","series-title":"Lecture notes in computer science","doi-asserted-by":"crossref","first-page":"399","DOI":"10.1007\/11816508_41","volume-title":"Proceedings of the 5th international conference on NLP (FinTAL 2006)","author":"T. Pahikkala","year":"2006","unstructured":"Pahikkala, T., Boberg, J., Myll\u00e4ri, A., & Salakoski, T. (2006a). Incorporating external information in Bayesian classifiers via linear feature transformations. In T. Salakoski, F. Ginter, S. Pyysalo, & T. Pahikkala (Eds.), Lecture notes in computer science: Vol.\u00a04139. Proceedings of the 5th international conference on NLP (FinTAL 2006) (pp.\u00a0399\u2013410). Heidelberg: Springer."},{"key":"5082_CR33","first-page":"83","volume-title":"Proceedings of the ninth Scandinavian conference on artificial intelligence (SCAI 2006)","author":"T. Pahikkala","year":"2006","unstructured":"Pahikkala, T., Boberg, J., & Salakoski, T. (2006b). Fast n-fold cross-validation for regularized least-squares. In T. Honkela, T. Raiko, J. Kortela, & H. Valpola (Eds.), Proceedings of the ninth Scandinavian conference on artificial intelligence (SCAI 2006) (pp.\u00a083\u201390). Espoo: Otamedia Oy."},{"key":"5082_CR34","first-page":"445","volume-title":"ICML\u00a0\u201998: proceedings of the fifteenth international conference on machine learning","author":"F. J. Provost","year":"1998","unstructured":"Provost, F. J., Fawcett, T., & Kohavi, R. (1998). The case against accuracy estimation for comparing induction algorithms. In ICML\u00a0\u201998: proceedings of the fifteenth international conference on machine learning (pp.\u00a0445\u2013453). San Francisco: Morgan Kaufmann."},{"key":"5082_CR35","unstructured":"Rifkin, R. (2002). Everything old is new again: a fresh look at historical approaches in machine learning. PhD thesis, MIT."},{"key":"5082_CR36","series-title":"NATO science series\u00a0III: computer and system sciences","first-page":"131","volume-title":"Advances in learning theory: methods, model and applications","author":"R. Rifkin","year":"2003","unstructured":"Rifkin, R., Yeo, G., & Poggio, T. (2003). Regularized least-squares classification. In J. Suykens, G. Horvath, S. Basu, C. Micchelli, & J. Vandewalle (Eds.), NATO science series\u00a0III: computer and system sciences: Vol.\u00a0190. Advances in learning theory: methods, model and applications (pp.\u00a0131\u2013154). Amsterdam: IOS Press."},{"key":"5082_CR37","volume-title":"Proceedings of the third international conference on language resources and evaluation","author":"T. G. Rose","year":"2002","unstructured":"Rose, T. G., Stevenson, M., & Whitehead, M. (2002). The Reuters corpus volume\u00a01: from yesterday\u2019s news to tomorrow\u2019s language resources. In M. G. Rodriguez & C. P. S. Araujo (Eds.), Proceedings of the third international conference on language resources and evaluation. Paris: ELRA."},{"key":"5082_CR38","volume-title":"Learning with kernels","author":"B. Sch\u00f6lkopf","year":"2002","unstructured":"Sch\u00f6lkopf, B., & Smola, A. J. (2002). Learning with kernels. Cambridge: MIT Press."},{"key":"5082_CR39","first-page":"640","volume-title":"Advances in neural information processing systems\u00a010","author":"B. Sch\u00f6lkopf","year":"1998","unstructured":"Sch\u00f6lkopf, B., Simard, P., Smola, A., & Vapnik, V. (1998). Prior knowledge in support vector kernels. In M.\u00a0I.\u00a0Jordan, M. J. Kearns, & S. A. Solla (Eds.), Advances in neural information processing systems\u00a010 (pp.\u00a0640\u2013646). Cambridge: MIT Press."},{"key":"5082_CR40","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511809682","volume-title":"Kernel methods for pattern analysis","author":"J. Shawe-Taylor","year":"2004","unstructured":"Shawe-Taylor, J., & Cristianini, N. (2004). Kernel methods for pattern analysis. Cambridge: Cambridge University Press."},{"key":"5082_CR41","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4899-3324-9","volume-title":"Density estimation for statistics and data analysis","author":"B. W. Silverman","year":"1986","unstructured":"Silverman, B. W. (1986). Density estimation for statistics and data analysis. London: Chapman & Hall."},{"key":"5082_CR42","first-page":"205","volume-title":"Proceedings of the IEEE-Inns-Enns international joint conference on neural networks","author":"G. Siolas","year":"2000","unstructured":"Siolas, G., & d\u2019Alch\u00e9-Buc, F. (2000). Support vector machines based on a semantic kernel for text categorization. In S.-I. Amari, C. L. Giles, M. Gori, & V. Piuri (Eds.), Proceedings of the IEEE-Inns-Enns international joint conference on neural networks (pp. 205\u2013209), Como, Italy. Washington: IEEE Computer Society."},{"key":"5082_CR43","doi-asserted-by":"crossref","unstructured":"Suzuki, J., Hirao, T., Sasaki, Y., & Maeda, E. (2003). Hierarchical directed acyclic graph kernel: methods for structured natural language data.","DOI":"10.3115\/1075096.1075101"},{"key":"5082_CR44","first-page":"142","volume-title":"Proceedings of CoNLL-2003","author":"K. S. E. F. Tjong","year":"2003","unstructured":"Tjong, K. S. E. F., & De Meulder, F. (2003). Introduction to the conll-2003 shared task: language-independent named entity recognition. In W. Daelemans & M. Osborne (Eds.), Proceedings of CoNLL-2003 (pp.\u00a0142\u2013147). Edmonton: Association for Computational Linguistics."},{"key":"5082_CR45","doi-asserted-by":"crossref","unstructured":"Tsivtsivadze, E., Pahikkala, T., Boberg, J., & Salakoski, T. (2006). Locality-convolution kernel and its application to dependency parse ranking. In The 19th international conference on industrial, engineering & other applications of applied intelligent systems. Forthcoming.","DOI":"10.1007\/11779568_66"},{"key":"5082_CR46","volume-title":"Statistical learning theory","author":"V. Vapnik","year":"1998","unstructured":"Vapnik, V. (1998). Statistical learning theory. New York: Wiley."},{"key":"5082_CR47","doi-asserted-by":"crossref","unstructured":"Vishwanathan, S., Smola, A. J., & Vidal, R. (2006, to appear). Binet-Cauchy kernels on dynamical systems and its application to the analysis of dynamic scenes. International Journal of Computer Vision.","DOI":"10.1007\/s11263-006-9352-0"},{"key":"5082_CR48","doi-asserted-by":"crossref","first-page":"80","DOI":"10.2307\/3001968","volume":"1","author":"F. Wilcoxon","year":"1945","unstructured":"Wilcoxon, F. (1945). Individual comparisons by ranking methods. Biometrics, 1, 80\u201383.","journal-title":"Biometrics"},{"key":"5082_CR49","doi-asserted-by":"crossref","unstructured":"Wong, S. K. M., Ziarko, W., & Wong, P. C. N. (1985). Generalized vector space model in information retrieval. In ACM SIGIR international conference on research and development in information retrieval (pp.\u00a018\u201325).","DOI":"10.1145\/253495.253506"},{"key":"5082_CR50","doi-asserted-by":"crossref","unstructured":"Yarowsky, D. (1993). One sense per collocation. In Proceedings, ARPA human language technology workshop, Princeton.","DOI":"10.3115\/1075671.1075731"},{"key":"5082_CR51","doi-asserted-by":"crossref","unstructured":"Yarowsky, D. (1995). Unsupervised word sense disambiguation rivaling supervised methods. In Meeting of the association for computational linguistics (pp.\u00a0189\u2013196).","DOI":"10.3115\/981658.981684"}],"container-title":["Machine Learning"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-008-5082-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10994-008-5082-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-008-5082-6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,29]],"date-time":"2024-02-29T18:00:07Z","timestamp":1709229607000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10994-008-5082-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2008,9,10]]},"references-count":51,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2009,2]]}},"alternative-id":["5082"],"URL":"https:\/\/doi.org\/10.1007\/s10994-008-5082-6","relation":{},"ISSN":["0885-6125","1573-0565"],"issn-type":[{"value":"0885-6125","type":"print"},{"value":"1573-0565","type":"electronic"}],"subject":[],"published":{"date-parts":[[2008,9,10]]}}}