{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,13]],"date-time":"2026-02-13T05:46:22Z","timestamp":1770961582161,"version":"3.50.1"},"publisher-location":"Berlin, Heidelberg","reference-count":23,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"value":"9783540786450","type":"print"},{"value":"9783540786467","type":"electronic"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1007\/978-3-540-78646-7_22","type":"book-chapter","created":{"date-parts":[[2008,3,26]],"date-time":"2008-03-26T12:45:33Z","timestamp":1206535533000},"page":"222-233","source":"Crossref","is-referenced-by-count":26,"title":["Automatic Extraction of Domain-Specific Stopwords from Labeled Documents"],"prefix":"10.1007","author":[{"given":"Masoud","family":"Makrehchi","sequence":"first","affiliation":[]},{"given":"Mohamed S.","family":"Kamel","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"22_CR1","unstructured":"Chen, A., Gey, F.C.: Building an Arabic stemmer for information retrieval. In: TREC (2002)"},{"key":"22_CR2","unstructured":"Craven, M., DiPasquo, D., Freitag, D., McCallum, A., Mitchell, T., Nigam, K., Slattery, S.: Learning to extract symbolic knowledge from the world wide web. In: Proceedings of the 15th National Conference on Artificial Intelligence (AAAI 1998), pp. 509\u2013516 (1998)"},{"key":"22_CR3","doi-asserted-by":"crossref","unstructured":"Crow, D., De Santo, J.: A hybrid approach to concept extraction and recognition-based matching in the domain of human resources. In: ICTAI, pp. 535\u2013539 (2004)","DOI":"10.1109\/ICTAI.2004.12"},{"key":"22_CR4","doi-asserted-by":"publisher","first-page":"1289","DOI":"10.1162\/153244303322753670","volume":"3","author":"G. Forman","year":"2003","unstructured":"Forman, G.: An extensive empirical study of feature selection metrics for text classification. Journal of Machine Learning Research\u00a03, 1289\u20131305 (2003)","journal-title":"Journal of Machine Learning Research"},{"key":"22_CR5","doi-asserted-by":"crossref","unstructured":"Forman, G.: A pitfall and solution in multi-class feature selection for text classification. In: Proceedings of ICML 2004, Twenty-first international conference on Machine learning, pp. 297\u2013304 (2004)","DOI":"10.1145\/1015330.1015356"},{"key":"22_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/1083142.1083153","volume-title":"MSR 2005: Proceedings of the 2005 international workshop on Mining software repositories","author":"J.H. Hayes","year":"2005","unstructured":"Hayes, J.H., Dekhtyar, A., Sundaram, S.: Text mining for software engineering: how analyst feedback impacts final results. In: MSR 2005: Proceedings of the 2005 international workshop on Mining software repositories, pp. 1\u20135. ACM Press, New York (2005)"},{"key":"22_CR7","first-page":"143","volume-title":"Proceedings of ICML 1997, 14th International Conference on Machine Learning","author":"T. Joachims","year":"1997","unstructured":"Joachims, T.: A probabilistic analysis of the Rocchio algorithm with TFIDF for text categorization. In: Fisher, D.H. (ed.) Proceedings of ICML 1997, 14th International Conference on Machine Learning, Nashville, US, pp. 143\u2013151. Morgan Kaufmann Publishers, San Francisco (1997)"},{"key":"22_CR8","first-page":"3010","volume-title":"Proceedings of the 34th Annual Hawaii International Conference on System Sciences (HICSS-34)","author":"M. Kawahara","year":"2001","unstructured":"Kawahara, M., Kawano, H.: Mining association algorithm with threshold based on roc analysis. In: Proceedings of the 34th Annual Hawaii International Conference on System Sciences (HICSS-34), vol.\u00a03, pp. 3010\u20133017. IEEE Computer Society, Los Alamitos (2001)"},{"key":"22_CR9","unstructured":"Koo, S.O., Lim, S.Y., Lee, S.-J.: Building an ontology based on hub words for information retrieval. In: Web Intelligence, pp. 466\u2013469 (2003)"},{"key":"22_CR10","first-page":"361","volume":"5","author":"D.D. Lewis","year":"2004","unstructured":"Lewis, D.D., Yang, Y., Rose, T.G., Li, F.: RCV1: A new benchmark collection for text categorization research. Journal of Machine Learning Research\u00a05, 361\u2013397 (2004)","journal-title":"Journal of Machine Learning Research"},{"key":"22_CR11","unstructured":"Liu, T., Liu, S., Chen, Z., Ma, W.-Y.: An evaluation on feature selection for text clustering. In: Proceedings of ICML 2003, pp. 488\u2013495 (2003)"},{"issue":"1","key":"22_CR12","first-page":"3","volume":"3","author":"R.T. Lo","year":"2005","unstructured":"Lo, R.T., He, B., Ounis, I.: Automatically building a stopword list for an information retrieval system. The Journal on Digital Information Management: special issue on the 5th Dutch-Belgian Information Retrieval Workshop (DIR 2005)\u00a03(1), 3\u20138 (2005)","journal-title":"The Journal on Digital Information Management: special issue on the 5th Dutch-Belgian Information Retrieval Workshop (DIR 2005)"},{"key":"22_CR13","doi-asserted-by":"crossref","unstructured":"Maletic, J.I., Valluri, N.: Automatic software clustering via latent semantic analysis. In: Proceedings 14th IEEE International Conference on Automated Software Engineering (ASE 1999), Cocoa Beach Florida, October 1999, pp. 251\u2013254 (1999)","DOI":"10.1109\/ASE.1999.802296"},{"key":"22_CR14","first-page":"359","volume-title":"Proceedings of ICML 1998, 15th International Conference on Machine Learning","author":"A.K. McCallum","year":"1998","unstructured":"McCallum, A.K., Rosenfeld, R., Mitchell, T.M., Ng, A.Y.: Improving text classification by shrinkage in a hierarchy of classes. In: Shavlik, J.W. (ed.) Proceedings of ICML 1998, 15th International Conference on Machine Learning, Madison, US, pp. 359\u2013367. Morgan Kaufmann Publishers, San Francisco (1998)"},{"key":"22_CR15","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"401","DOI":"10.1007\/978-3-540-30222-3_39","volume-title":"Comparative Evaluation of Multilingual Information Access Systems","author":"V. Petras","year":"2004","unstructured":"Petras, V., Perelman, N., Gey, F.C.: UC berkeley at clef-2003 - Russian language experiments and domain-specific retrieval. In: Peters, C., Gonzalo, J., Braschler, M., Kluck, M. (eds.) CLEF 2003. LNCS, vol.\u00a03237, pp. 401\u2013411. Springer, Heidelberg (2004)"},{"key":"22_CR16","doi-asserted-by":"crossref","unstructured":"Rijsbergen, C.J., Harper, D.J., Porter, M.F.: The selection of good search terms. In: Information Processing and Management, pp. 77\u201391 (1981)","DOI":"10.1016\/0306-4573(81)90029-7"},{"key":"22_CR17","doi-asserted-by":"crossref","unstructured":"Rogati, M., Yang, Y.: High-performing feature selection for text classification. In: Proceedings of the eleventh international conference on Information and knowledge management, pp. 659\u2013661 (2002)","DOI":"10.1145\/584792.584911"},{"key":"22_CR18","doi-asserted-by":"crossref","unstructured":"Savoy, J.: A stemming procedure and stopword list for general French corpora. Journal of the American Society for Information Science, 944\u2013952 (1999)","DOI":"10.1002\/(SICI)1097-4571(1999)50:10<944::AID-ASI9>3.0.CO;2-Q"},{"key":"22_CR19","doi-asserted-by":"crossref","unstructured":"Seki, K., Mostafa, J.: An application of text categorization methods to gene ontology annotation. In: SIGIR, pp. 138\u2013145 (2005)","DOI":"10.1145\/1076034.1076060"},{"key":"22_CR20","unstructured":"Sinka, M.P., Corne, D.W.: Evolving better stoplists for document clustering and web intelligence. Design and application of hybrid intelligent systems, 1015\u20131023 (2003)"},{"key":"22_CR21","doi-asserted-by":"publisher","first-page":"396","DOI":"10.1109\/WI.2003.1241221","volume-title":"Proceedings of the IEEE\/WIC International Conference on Web Intelligence","author":"M.P. Sinka","year":"2003","unstructured":"Sinka, M.P., Corne, D.W.: Towards modernised and web-specific stoplists for web document analysis. In: Proceedings of the IEEE\/WIC International Conference on Web Intelligence, pp. 396\u2013402. IEEE Computer Society, Los Alamitos (2003)"},{"key":"22_CR22","unstructured":"Van Rijsbergen, C.J.: Information Retrieval, 2nd edn., Dept. of Computer Science, University of Glasgow (1979)"},{"key":"22_CR23","first-page":"412","volume-title":"Proceedings of ICML 1997, 14th International Conference on Machine Learning","author":"Y. Yang","year":"1997","unstructured":"Yang, Y., Pedersen, J.O.: A comparative study on feature selection in text categorization. In: Fisher, D.H. (ed.) Proceedings of ICML 1997, 14th International Conference on Machine Learning, Nashville, US, pp. 412\u2013420. Morgan Kaufmann Publishers, San Francisco (1997)"}],"container-title":["Lecture Notes in Computer Science","Advances in Information Retrieval"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-78646-7_22.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,4,27]],"date-time":"2021-04-27T11:16:50Z","timestamp":1619522210000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-78646-7_22"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"ISBN":["9783540786450","9783540786467"],"references-count":23,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-78646-7_22","relation":{},"subject":[]}}