{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,17]],"date-time":"2025-10-17T13:46:42Z","timestamp":1760708802281},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2015,2,28]],"date-time":"2015-02-28T00:00:00Z","timestamp":1425081600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Lang Resources &amp; Evaluation"],"published-print":{"date-parts":[[2015,6]]},"DOI":"10.1007\/s10579-015-9298-3","type":"journal-article","created":{"date-parts":[[2015,2,27]],"date-time":"2015-02-27T09:08:28Z","timestamp":1425028108000},"page":"227-261","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Text Categorization from category name in an industry-motivated scenario"],"prefix":"10.1007","volume":"49","author":[{"given":"Chaya","family":"Liebeskind","sequence":"first","affiliation":[]},{"given":"Lili","family":"Kotlerman","sequence":"additional","affiliation":[]},{"given":"Ido","family":"Dagan","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,2,28]]},"reference":[{"key":"9298_CR1","unstructured":"Ali, A., Magdy, W., & Vogel, S. (2013). A tool for monitoring and analyzing healthcare tweets. In HSD workshop, SIGIR 2013."},{"issue":"8","key":"9298_CR2","doi-asserted-by":"crossref","first-page":"1485","DOI":"10.1287\/mnsc.1110.1370","volume":"57","author":"N Archak","year":"2011","unstructured":"Archak, N., Ghose, A., & Ipeirotis, P. G. (2011). Deriving the pricing power of product features by mining consumer reviews. Management Science, 57(8), 1485\u20131509.","journal-title":"Management Science"},{"key":"9298_CR3","doi-asserted-by":"crossref","unstructured":"Barak, L., Dagan, I., & Shnarch, E. (2009). Text categorization from category name via lexical reference. In Proceedings of human language technologies: The 2009 annual conference of the North American chapter of the Association for Computational Linguistics, Companion volume: Short papers, NAACL-Short\u201909 (pp. 33\u201336). Association for Computational Linguistics, Stroudsburg, PA, USA. http:\/\/dl.acm.org\/citation.cfm?id=1620853.1620864","DOI":"10.3115\/1620853.1620864"},{"key":"9298_CR4","unstructured":"Baroni, M., & Zamparelli, R. (2010). Nouns are vectors, adjectives are matrices: Representing adjective-noun constructions in semantic space. In Proceedings of the 2010 conference on empirical methods in natural language processing, EMNLP\u201910 (pp. 1183\u20131193). Association for Computational Linguistics, Stroudsburg, PA, USA. http:\/\/dl.acm.org\/citation.cfm?id=1870658.1870773"},{"key":"9298_CR5","first-page":"993","volume":"3","author":"DM Blei","year":"2003","unstructured":"Blei, D. M., Ng, A. Y., & Jordan, M. I. (2003). Latent dirichlet allocation. Journal of Machine Learning Research, 3, 993\u20131022.","journal-title":"Journal of Machine Learning Research"},{"key":"9298_CR7","unstructured":"Church, K.W., & Hanks, P. (1990). Word association norms, mutual information, and lexicography. Computational linguistics, 16(1), 22\u201329. http:\/\/dl.acm.org\/citation.cfm?id=89086.89095"},{"key":"9298_CR6","unstructured":"de Buenaga Rodriguez, M., Go\u2019mez-Hidalgo, J. M., & Diaz-Agudo, B. (1997). Using WordNet to complement training information in text categorization. In N. Nicolov, & R. Mitkov (Eds.), Recent advances in natural language processing II: Selected papers from the second international conference on recent advances in natural language processing (RANLP 1997), March 25\u201327, 1997, Stanford, CA, USA, Amsterdam Studies in the Theory and History of Linguistic Science, Series IV: Current Issues in Linguistic Theory (pp. 353\u2013364). Amsterdam, The Netherlands: John Benjamins Publishing."},{"issue":"6","key":"9298_CR8","doi-asserted-by":"crossref","first-page":"391","DOI":"10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9","volume":"41","author":"S Deerwester","year":"1990","unstructured":"Deerwester, S., Dumais, S. T., Furnas, G. W., Landauer, T. K., & Harshman, R. (1990). Indexing by latent semantic analysis. Journal of the American Society for Information Science, 41(6), 391\u2013407.","journal-title":"Journal of the American Society for Information Science"},{"key":"9298_CR9","doi-asserted-by":"crossref","unstructured":"Diakopoulos, N., Naaman, M., & Kivran-Swaine, F.: Diamonds in the rough: Social media visual analytics for journalistic inquiry. In 2010 IEEE symposium on visual analytics science and technology (VAST) (pp. 115\u2013122). IEEE (2010).","DOI":"10.1109\/VAST.2010.5652922"},{"key":"9298_CR10","unstructured":"Downey, D., & Etzioni, O. (2008). Look ma, no hands: Analyzing the monotonic feature abstraction for text classification. In Proceedings of the 22nd Annual Conference on Neural Information Processing Systems (NIPS-08), Vancouver, Canada. http:\/\/books.nips.cc\/papers\/files\/nips21\/NIPS2008_0054.pdf"},{"key":"9298_CR11","doi-asserted-by":"crossref","unstructured":"Eichler, K., Gabryszak, A., & Neumann, G. (2014). An analysis of textual inference in german customer emails. Lexical and Computational Semantics (*SEM 2014) p. 69.","DOI":"10.3115\/v1\/S14-1009"},{"issue":"4","key":"9298_CR12","doi-asserted-by":"crossref","first-page":"419","DOI":"10.1007\/s13218-012-0221-4","volume":"26","author":"K Eichler","year":"2012","unstructured":"Eichler, K., Meisdrock, M., & Schmeier, S. (2012). Search and topic detection in customer requests. KI-K\u00fcnstliche Intelligenz, 26(4), 419\u2013422.","journal-title":"KI-K\u00fcnstliche Intelligenz"},{"key":"9298_CR13","volume-title":"WordNet: An electronic lexical database","year":"1998","unstructured":"Fellbaum, C. (Ed.). (1998). WordNet: An electronic lexical database. Cambridge: MIT Press."},{"key":"9298_CR14","doi-asserted-by":"crossref","unstructured":"Fleischman, M., & Hovy, E. (2002). Fine grained classification of named entities. In Proceedings of the 19th international conference on computational linguistics\u2014COLING\u201902, (Vol. 1, pp. 1\u20137). Stroudsburg, PA, USA: Association for Computational Linguistics. doi: 10.3115\/1072228.1072358","DOI":"10.3115\/1072228.1072358"},{"key":"9298_CR15","doi-asserted-by":"crossref","unstructured":"Funk, A., Li, Y., Saggion, H., Bontcheva, K., & Leibold, C. (2008). Opinion analysis for business intelligence applications. In Proceedings of the first international workshop on Ontology-supported business intelligence. New York: ACM.","DOI":"10.1145\/1452567.1452570"},{"key":"9298_CR16","unstructured":"Gabrilovich, E., & Markovitch, S. (2007). Computing semantic relatedness using wikipedia-based explicit semantic analysis. In IJCAI, pp. 1606\u20131611."},{"key":"9298_CR17","doi-asserted-by":"crossref","unstructured":"Giampiccolo, D., Magnini, B., Dagan, I., & Dolan, B. (2007). The third pascal recognizing textual entailment challenge. In Proceedings of the ACL-PASCAL workshop on textual entailment and paraphrasing, RTE\u201907 (pp. 1\u20139). Stroudsburg, PA, USA: Association for Computational Linguistics. http:\/\/dl.acm.org\/citation.cfm?id=1654536.1654538","DOI":"10.3115\/1654536.1654538"},{"key":"9298_CR18","doi-asserted-by":"crossref","unstructured":"Glickman, O., & Dagan, I. (2005). A probabilistic setting and lexical cooccurrence model for textual entailment. In Proceedings of the ACL workshop on empirical modeling of semantic equivalence and entailment, EMSEE\u201905, (pp. 43\u201348). Stroudsburg, PA, USA: Association for Computational Linguistics. http:\/\/dl.acm.org\/citation.cfm?id=1631862.1631870","DOI":"10.3115\/1631862.1631870"},{"key":"9298_CR19","doi-asserted-by":"crossref","unstructured":"Glickman, O., Shnarch, E., & Dagan, I. (2006). Lexical reference: A semantic matching subtask. In Proceedings of the 2006 conference on empirical methods in natural language processing, EMNLP\u201906 (pp. 172\u2013179). Stroudsburg, PA, USA: Association for Computational Linguistics. http:\/\/dl.acm.org\/citation.cfm?id=1610075.1610103","DOI":"10.3115\/1610075.1610103"},{"key":"9298_CR20","doi-asserted-by":"crossref","unstructured":"Gliozzo, A., Strapparava, C., & Dagan, I. (2005). Investigating unsupervised learning for text categorization bootstrapping. In Proceedings of the conference on human language technology and empirical methods in natural language processing, HLT\u201905, (pp. 129\u2013136). Stroudsburg, PA, USA: Association for Computational Linguistics. doi: 10.3115\/1220575.1220592","DOI":"10.3115\/1220575.1220592"},{"issue":"1","key":"9298_CR21","doi-asserted-by":"crossref","first-page":"1:1","DOI":"10.1145\/1596515.1596516","volume":"6","author":"A Gliozzo","year":"2009","unstructured":"Gliozzo, A., Strapparava, C., & Dagan, I. (2009). Improving text categorization bootstrapping via unsupervised learning. ACM Transactions on Speech and Language Processing, 6(1), 1:1\u20131:24. doi: 10.1145\/1596515.1596516","journal-title":"ACM Transactions on Speech and Language Processing"},{"key":"9298_CR22","unstructured":"Grefenstette, E., & Sadrzadeh, M. (2011). Experimental support for a categorical compositional distributional model of meaning. In Proceedings of the conference on empirical methods in natural language processing, EMNLP\u201911 (pp. 1394\u20131404). Stroudsburg, PA, USA: Association for Computational Linguistics. http:\/\/dl.acm.org\/citation.cfm?id=2145432.2145580"},{"key":"9298_CR23","doi-asserted-by":"crossref","unstructured":"Hu, M., & Liu, B. (2004). Mining and summarizing customer reviews. In Proceedings of the tenth ACM SIGKDD international conference on knowledge discovery and data mining, KDD\u201904, (pp. 168\u2013177). New York, NY, USA: ACM. doi: 10.1145\/1014052.1014073","DOI":"10.1145\/1014052.1014073"},{"key":"9298_CR24","doi-asserted-by":"crossref","unstructured":"Ko, Y., & Seo, J. (2004). Learning with unlabeled data for text categorization using bootstrapping and feature projection techniques. In Proceedings of the 42nd annual meeting on association for computational linguistics, ACL\u201904. Stroudsburg, PA, USA: Association for Computational Linguistics. doi: 10.3115\/1218955.1218988","DOI":"10.3115\/1218955.1218988"},{"key":"9298_CR25","doi-asserted-by":"crossref","unstructured":"Li, C., Weng, J., He, Q., Yao, Y., Datta, A., Sun, A., & Lee, B. S. (2012). Twiner: Named entity recognition in targeted twitter stream. In Proceedings of the 35th international ACM SIGIR conference on research and development in information retrieval, SIGIR\u201912 (pp. 721\u2013730). New York, NY, USA: ACM. doi: 10.1145\/2348283.2348380","DOI":"10.1145\/2348283.2348380"},{"key":"9298_CR26","unstructured":"Liu, B., Li, X., Lee, W. S., & Yu, P. S. (2004). Text classification by labeling words. In Proceedings of the 19th national conference on Artifical intelligence, AAAI\u201904, (pp. 425\u2013430). San Jose: AAAI Press. http:\/\/dl.acm.org\/citation.cfm?id=1597148.1597218"},{"key":"9298_CR27","doi-asserted-by":"crossref","unstructured":"Liu, B., & Zhang, L. (2012). A survey of opinion mining and sentiment analysis. In Mining text data, (pp. 415\u2013463). Berlin: Springer.","DOI":"10.1007\/978-1-4614-3223-4_13"},{"key":"9298_CR28","unstructured":"Mansuy, T., & Hilderman, R. J. (2006). A characterization of wordnet features in boolean models for text classification. In Proceedings of the fifth Australasian conference on data mining and analystics\u2014AusDM\u201906, (Vol. 61, pp. 103\u2013109). Darlinghurst, Australia: Australian Computer Society Inc. http:\/\/dl.acm.org\/citation.cfm?id=1273808.1273822"},{"key":"9298_CR29","doi-asserted-by":"crossref","unstructured":"Maynard, D., & Funk, A. (2012). Automatic detection of political opinions in tweets. In The semantic web: ESWC 2011 workshops (pp. 88\u201399). Berlin: Springer.","DOI":"10.1007\/978-3-642-25953-1_8"},{"key":"9298_CR30","unstructured":"Mccallum, A., & Nigam, K. (1999). Text classification by bootstrapping with keywords, em and shrinkage. In ACL99\u2014Workshop for unsupervised learning in natural language processing (pp. 52\u201358)."},{"key":"9298_CR31","doi-asserted-by":"crossref","unstructured":"Metzler, D., Dumais, S. T., & Meek, C. (2007). Similarity measures for short segments of text. In ECIR (pp. 16\u201327).","DOI":"10.1007\/978-3-540-71496-5_5"},{"issue":"8","key":"9298_CR32","doi-asserted-by":"crossref","first-page":"1388","DOI":"10.1111\/j.1551-6709.2010.01106.x","volume":"34","author":"J Mitchell","year":"2010","unstructured":"Mitchell, J., & Lapata, M. (2010). Composition in distributional models of semantics. Cognitive Science, 34(8), 1388\u20131439.","journal-title":"Cognitive Science"},{"key":"9298_CR33","unstructured":"Pasca, M., & Harabagiu, S. M. (2001). The informative role of WordNet in open-domain question answering. In Proceedings of the NAACL 2001 workshop on wordnet and other lexical resources: Applications, extensions and customizations (pp. 138\u2013143)."},{"key":"9298_CR34","doi-asserted-by":"crossref","unstructured":"Ritter, A., Etzioni Mausam, O., & Clark, S. (2012). Open domain event extraction from twitter. In Proceedings of the 18th ACM SIGKDD international conference on knowledge discovery and data mining, KDD\u201912 (pp. 1104\u20131112). New York, NY, USA: ACM. doi: 10.1145\/2339530.2339704","DOI":"10.1145\/2339530.2339704"},{"key":"9298_CR35","doi-asserted-by":"crossref","first-page":"77","DOI":"10.3115\/1613984.1614004","volume-title":"HLT-NAACL 2004: Short Papers","author":"A Rosenberg","year":"2004","unstructured":"Rosenberg, A., & Binkowski, E. (2004). Augmenting the kappa statistic to determine interannotator reliability for multiply labeled data points. In D. M. Susan Dumais & S. Roukos (Eds.), HLT-NAACL 2004: Short Papers (pp. 77\u201380). Boston, MA: Association for Computational Linguistics."},{"key":"9298_CR36","unstructured":"Ruhl, J., Datar, M., & Lee, J. (2006). Method, system and graphical user interface for providing reviews for a product. https:\/\/www.google.com\/patents\/US20060143158 . US Patent App. 11\/012,846"},{"issue":"17","key":"9298_CR37","first-page":"119","volume":"10","author":"H Saggion","year":"2009","unstructured":"Saggion, H., & Funk, A. (2009). Extracting opinions and facts for business intelligence. RNTI Journal, 10(17), 119\u2013146.","journal-title":"RNTI Journal"},{"issue":"1","key":"9298_CR38","doi-asserted-by":"crossref","first-page":"121","DOI":"10.1080\/19331680802149582","volume":"5","author":"A Scharl","year":"2008","unstructured":"Scharl, A., & Weichselbraun, A. (2008). An automated approach to investigating the online media coverage of US presidential elections. Journal of Information Technology & Politics, 5(1), 121\u2013132.","journal-title":"Journal of Information Technology & Politics"},{"key":"9298_CR39","unstructured":"Scott, S., & Matwin, S. (1999). Feature engineering for text classification. In Proceedings of the sixteenth international conference on machine learning, ICML\u201999, pp. 379\u2013388. San Francisco, CA, USA: Morgan Kaufmann Publishers Inc. http:\/\/dl.acm.org\/citation.cfm?id=645528.657484"},{"issue":"1","key":"9298_CR40","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/505282.505283","volume":"34","author":"F Sebastiani","year":"2002","unstructured":"Sebastiani, F. (2002). Machine learning in automated text categorization. ACM Computing Surveys, 34(1), 1\u201347. doi: 10.1145\/505282.505283","journal-title":"ACM Computing Surveys"},{"key":"9298_CR41","doi-asserted-by":"crossref","unstructured":"Shah, C., & Croft, W. B. (2004). Evaluating high accuracy retrieval techniques. In Proceedings of the 27th annual international ACM SIGIR conference on Research and development in information retrieval, SIGIR\u201904 (pp. 2\u20139). New York, NY, USA: ACM. doi: 10.1145\/1008992.1008996","DOI":"10.1145\/1008992.1008996"},{"key":"9298_CR42","doi-asserted-by":"crossref","unstructured":"Shnarch, E., Barak, L., & Dagan, I. (2009). Extracting lexical reference rules from wikipedia. In Proceedings of the joint conference of the 47th annual meeting of the ACL and the 4th international joint conference on natural language processing of the AFNLP, ACL\u201909 (Vol. 1, pp. 450\u2013458). Stroudsburg, PA, USA: Association for Computational Linguistics. http:\/\/dl.acm.org\/citation.cfm?id=1687878.1687942","DOI":"10.3115\/1687878.1687942"},{"key":"9298_CR43","unstructured":"Smadja, F., McKeown, K. R., & Hatzivassiloglou, V. (1996). Translating collocations for bilingual lexicons: A statistical approach. Computational Linguistics, 22(1), 1\u201338. http:\/\/dl.acm.org\/citation.cfm?id=234285.234287"},{"key":"9298_CR44","unstructured":"Socher, R., Huval, B., Manning, C. D., & Ng, A. Y. (2012). Semantic compositionality through recursive matrix-vector spaces. In Proceedings of the 2012 joint conference on empirical methods in natural language processing and computational natural language learning, EMNLP-CoNLL\u201912 (pp. 1201\u20131211). Stroudsburg, PA, USA: Association for Computational Linguistics. http:\/\/dl.acm.org\/citation.cfm?id=2390948.2391084"},{"key":"9298_CR45","doi-asserted-by":"crossref","first-page":"178","DOI":"10.1609\/icwsm.v4i1.14009","volume":"10","author":"A Tumasjan","year":"2010","unstructured":"Tumasjan, A., Sprenger, T. O., Sandner, P. G., & Welpe, I. M. (2010). Predicting elections with twitter: What 140 characters reveal about political sentiment. ICWSM, 10, 178\u2013185.","journal-title":"ICWSM"},{"issue":"6","key":"9298_CR46","doi-asserted-by":"crossref","first-page":"80","DOI":"10.2307\/3001968","volume":"1","author":"F Wilcoxon","year":"1945","unstructured":"Wilcoxon, F. (1945). Individual comparisons by ranking methods. Biometrics Bulletin, 1(6), 80\u201383. doi: 10.2307\/3001968","journal-title":"Biometrics Bulletin"},{"key":"9298_CR47","doi-asserted-by":"crossref","unstructured":"Xu, J., & Croft, W. B. (1996). Query expansion using local and global document analysis. In Proceedings of the 19th annual international ACM SIGIR conference on research and development in information retrieval, (pp. 4\u201311). New York: ACM.","DOI":"10.1145\/243199.243202"}],"container-title":["Language Resources and Evaluation"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-015-9298-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10579-015-9298-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-015-9298-3","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,7]],"date-time":"2023-08-07T19:07:28Z","timestamp":1691435248000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10579-015-9298-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,2,28]]},"references-count":47,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2015,6]]}},"alternative-id":["9298"],"URL":"https:\/\/doi.org\/10.1007\/s10579-015-9298-3","relation":{},"ISSN":["1574-020X","1574-0218"],"issn-type":[{"value":"1574-020X","type":"print"},{"value":"1574-0218","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,2,28]]}}}