{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,17]],"date-time":"2026-03-17T15:23:49Z","timestamp":1773761029023,"version":"3.50.1"},"reference-count":20,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2013,3,10]],"date-time":"2013-03-10T00:00:00Z","timestamp":1362873600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Lang Resources &amp; Evaluation"],"published-print":{"date-parts":[[2013,6]]},"DOI":"10.1007\/s10579-013-9221-8","type":"journal-article","created":{"date-parts":[[2013,3,8]],"date-time":"2013-03-08T22:53:09Z","timestamp":1362783189000},"page":"513-538","source":"Crossref","is-referenced-by-count":98,"title":["Comparative evaluation of text classification techniques using a large diverse Arabic dataset"],"prefix":"10.1007","volume":"47","author":[{"given":"Mohammad S.","family":"Khorsheed","sequence":"first","affiliation":[]},{"given":"Abdulmohsen O.","family":"Al-Thubaity","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2013,3,10]]},"reference":[{"key":"9221_CR2","first-page":"118","volume":"1","author":"S Al-Saleem","year":"2010","unstructured":"Al-Saleem, S. (2010). Associative classification to categorize Arabic data sets. The International Journal Of ACM JORDAN, 1, 118\u2013127.","journal-title":"The International Journal Of ACM JORDAN"},{"issue":"1","key":"9221_CR4","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1093\/llc\/7.1.1","volume":"7","author":"S Atkins","year":"1992","unstructured":"Atkins, S., Clear, J., & Ostler, N. (1992). Corpus design criteria. Literary and Linguistic Computing, 7(1), 1\u201316.","journal-title":"Literary and Linguistic Computing"},{"key":"9221_CR5","doi-asserted-by":"crossref","first-page":"600","DOI":"10.3844\/jcssp.2008.600.605","volume":"4","author":"JM Bawaneh","year":"2008","unstructured":"Bawaneh, J. M., Alkoffash, M. S., & Alrabea, A. I. (2008). Arabic text classification using K-NN and Naive Bayes. Journal of Computer Science, 4, 600\u2013605.","journal-title":"Journal of Computer Science"},{"issue":"1\/2","key":"9221_CR6","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1023\/A:1023824908771","volume":"19","author":"J Diederich","year":"2003","unstructured":"Diederich, J., Kindermann, J. L., Leopold, E., & PAA\u00df, G. (2003). Authorship attribution with support vector machines. Applied Intelligence, 19(1\/2), 109\u2013123.","journal-title":"Applied Intelligence"},{"issue":"8","key":"9221_CR7","doi-asserted-by":"crossref","first-page":"1005","DOI":"10.1002\/asi.20360","volume":"57","author":"R Duwairi","year":"2006","unstructured":"Duwairi, R. (2006). Machine learning for Arabic text categorization. Journal of the American Society for Information Science and Technology JASIST, 57(8), 1005\u20131010.","journal-title":"Journal of the American Society for Information Science and Technology JASIST"},{"issue":"11","key":"9221_CR8","doi-asserted-by":"crossref","first-page":"2347","DOI":"10.1002\/asi.21173","volume":"60","author":"R Duwairi","year":"2009","unstructured":"Duwairi, R., Al-Refai, M., & Khasawneh, N. (2009). Feature reduction techniques for Arabic text categorization. Journal of the American Society for Information Science, 60(11), 2347\u20132352.","journal-title":"Journal of the American Society for Information Science"},{"key":"9221_CR9","unstructured":"El-Halees, A. (2008). A comparative study on Arabic text classification, Egyptian Computer Science Journal, 30(2). http:\/\/www.informatik.uni-trier.de\/~ley\/db\/journals\/ecs\/ecs30.html"},{"key":"9221_CR10","unstructured":"Elkourdi, M., Bensaid, A., & Rachidi, T. (2004). Automatic Arabic document categorization based on the Naive Bayes algorithm. In Proceedings of COLING 20th Workshop on Computational Approaches to Arabic Script-Based Languages, (pp. 51\u201358)."},{"key":"9221_CR12","unstructured":"Kanaan, G., Al-Shalabi R., & Al-Azzam, O. (2005). Automatic text classification using Na\u00efve Bayesian algorithm on Arabic language. In Proceedings of the 5 th International Business Information Management Conference (IBIMA), (pp. 327\u2013339)."},{"issue":"9","key":"9221_CR13","doi-asserted-by":"crossref","first-page":"1836","DOI":"10.1002\/asi.20832","volume":"60","author":"G Kanaan","year":"2009","unstructured":"Kanaan, G., Al-Shalabi, R., Ghwanmeh, S., & Al-Ma\u2019adeed, H. (2009). A comparison of text-classification techniques applied to Arabic text. Journal of the American Society for Information Science and Technology, 60(9), 1836\u20131844.","journal-title":"Journal of the American Society for Information Science and Technology"},{"key":"9221_CR14","unstructured":"Khreisat, L. (2006). Arabic text classification using N-gram frequency statistics a comparative study. In Proceedings of the 2006 International Conference on Data Mining, (pp. 78\u201382)."},{"issue":"6","key":"9221_CR15","doi-asserted-by":"crossref","first-page":"430","DOI":"10.3844\/jcssp.2007.430.435","volume":"3","author":"AA Mesleh","year":"2007","unstructured":"Mesleh, A. A. (2007). Chi square feature extraction based Svms Arabic language text categorization system. Journal of Computer Science, 3(6), 430\u2013435.","journal-title":"Journal of Computer Science"},{"key":"9221_CR16","volume-title":"KDD 06 Proceedings of the 12th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, 935\u2013940","author":"I Mierswa","year":"2006","unstructured":"Mierswa, I., Wurst, M., Klinkenberg, R., Scholz, M., & Euler, T. (2006). YALE: Rapid prototyping for complex data mining tasks. In L. Ungar, M. Craven, D. Gunopulos, & T. Eliassi-Rad (Eds.), KDD 06 Proceedings of the 12th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, 935\u2013940. New York, USA: ACM."},{"key":"9221_CR17","unstructured":"Sawaf, H., Zaplo, J., & Ney, H. (2001). Statistical classification methods for Arabic news articles. Arabic Natural Language Processing Workshop, ACL\u20192001, (pp. 127\u2013132)."},{"issue":"1","key":"9221_CR18","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/505282.505283","volume":"34","author":"F Sebastiani","year":"2002","unstructured":"Sebastiani, F. (2002). Machine learning in automated text categorization. ACM Computing Surveys, 34(1), 1\u201347.","journal-title":"ACM Computing Surveys"},{"key":"9221_CR19","first-page":"17","volume-title":"Studies in anglistics","author":"J Sinclair","year":"1995","unstructured":"Sinclair, J. (1995). Corpus typology\u2013a framework for classification. In G. Melchers & B. Warren (Eds.), Studies in anglistics (pp. 17\u201333). Stockholm: Almqvist & Wiksell."},{"issue":"1","key":"9221_CR20","first-page":"1","volume":"6","author":"MM Syiam","year":"2006","unstructured":"Syiam, M. M., Fayed, Z. T., & Habib, M. B. (2006). An intelligent system for Arabic text categorization. International Journal of Intelligent Computing and Information Sciences, 6(1), 1\u201319.","journal-title":"International Journal of Intelligent Computing and Information Sciences"},{"key":"9221_CR21","unstructured":"Thabtah, F., Eljinini, M., Zamzeer, M., & Hadi, W. (2009). Na\u00efve Bayesian based on Chi Square to categorize Arabic data. In Proceedings of The 11th International Business Information Management Association Conference (IBIMA) Conference on Innovation and Knowledge Management in Twin Track Economies, (pp. 930\u2013935)."},{"key":"9221_CR22","unstructured":"Thabtah, F., Hadi, W., & Al-Shammare, G. (2008). VSMs with K-Nearest Neighbour to categorise Arabic text data. In The World Congress on Engineering and Computer Science 2008, (pp. 778\u2013781)."},{"issue":"Special Issue o","key":"9221_CR23","first-page":"69","volume":"7","author":"MM Zahran","year":"2009","unstructured":"Zahran, M. M., Kanaan, G., & Habib, M. B. (2009). Text feature selection using particle Swarm optimization algorithm. World Applied Sciences Journal, 7(Special Issue of Computer & IT), 69\u201374.","journal-title":"World Applied Sciences Journal"}],"container-title":["Language Resources and Evaluation"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-013-9221-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10579-013-9221-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-013-9221-8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,30]],"date-time":"2019-05-30T14:21:18Z","timestamp":1559226078000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10579-013-9221-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,3,10]]},"references-count":20,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2013,6]]}},"alternative-id":["9221"],"URL":"https:\/\/doi.org\/10.1007\/s10579-013-9221-8","relation":{},"ISSN":["1574-020X","1574-0218"],"issn-type":[{"value":"1574-020X","type":"print"},{"value":"1574-0218","type":"electronic"}],"subject":[],"published":{"date-parts":[[2013,3,10]]}}}