{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T07:26:54Z","timestamp":1740122814458,"version":"3.37.3"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2015,6,9]],"date-time":"2015-06-09T00:00:00Z","timestamp":1433808000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Speech Technol"],"published-print":{"date-parts":[[2016,6]]},"DOI":"10.1007\/s10772-015-9284-6","type":"journal-article","created":{"date-parts":[[2015,6,9]],"date-time":"2015-06-09T17:21:42Z","timestamp":1433870502000},"page":"191-201","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Semantic similarity based approach for reducing Arabic texts dimensionality"],"prefix":"10.1007","volume":"19","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7067-5658","authenticated-orcid":false,"given":"Arafat","family":"Awajan","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2015,6,9]]},"reference":[{"key":"9284_CR1","unstructured":"Almaany. (2014). Dictionary and glossary. http:\/\/www.almaany.com\/ ."},{"issue":"4","key":"9284_CR2","first-page":"179","volume":"25","author":"A Awajan","year":"2007","unstructured":"Awajan, A. (2007). Arabic text preprocessing for the natural language processing applications. Arab Gulf Journal of Scientific Research, 25(4), 179\u2013189.","journal-title":"Arab Gulf Journal of Scientific Research"},{"key":"9284_CR3","doi-asserted-by":"crossref","unstructured":"Awajan, A. (2015). Semantic vector space model for reducing arabic text dimensionality. In Proceedings of the 5th international conference on digital information and communication technology and its applications, Lebanon, (pp. 129\u2013135). April 29\u2013May 1, 2015.","DOI":"10.1109\/DICTAP.2015.7113185"},{"key":"9284_CR4","unstructured":"Baker, K. (2013). Singular value decomposition tutorial. Note for NLP Seminar. 1\u201324. Accessed December 2013, from www.ling.ohio-state.edu\/~kbaker\/pubs\/Singular_Value_Decomposition_Tutorial.pdf ."},{"key":"9284_CR5","unstructured":"Beesley, K. R. (1998). Consonant spreading in Arabic stems. In COLING-ACL\u201998, vol 1, pp 117\u2013123, Montreal, Quebec, Canada, August 10\u201314."},{"key":"9284_CR6","unstructured":"Biemann, C. (2006). Chinese whispers\u2014An efficient graph clustering algorithm and its application to natural language processing problems. Workshop on TextGraphs, at HLT-NAACL 2006, pp. 73\u201380"},{"key":"9284_CR7","unstructured":"Boudlal, A., Lakhouaja, A., Mazroui, A., Meziane, A., Ould Abdallahi, O. B. M., & Shoul, M. (2010). Alkhalil Morpho Sys: A morphosyntactic analysis system for Arabic texts. In International Arab conference on information technology. http:\/\/www.itpapers.info\/acit10\/Papers\/f653 ."},{"key":"9284_CR8","doi-asserted-by":"crossref","first-page":"890","DOI":"10.3758\/s13428-011-0183-8","volume":"44","author":"JA Bullinaria","year":"2012","unstructured":"Bullinaria, J. A., & Levy, J. P. (2012). Extracting semantic representations from word co-occurrence statistics: Stop-lists, stemming and SVD. Behavior Research Methods, 44, 890\u2013907.","journal-title":"Behavior Research Methods"},{"issue":"11","key":"9284_CR9","doi-asserted-by":"crossref","first-page":"2347","DOI":"10.1002\/asi.21173","volume":"60","author":"R Duwairi","year":"2009","unstructured":"Duwairi, R., Al-Refai, M. N., & Khasawneh, N. (2009). Feature reduction techniques for Arabic text categorization. Journal of the American Society for Information Science and Technology, 60(11), 2347\u20132352.","journal-title":"Journal of the American Society for Information Science and Technology"},{"key":"9284_CR10","unstructured":"Elkateb, S., Black, W., Rodr\u00edguez, H., Alkhalifa, M., Vossen, P., Pease, A., & Fellbaum, C. (2006). Building a WordNet for Arabic. In Proceedings of the fifth international conference on language resources and evaluation (LREC 2006). Genoa, Italy, May 22\u201328, 2006."},{"key":"9284_CR11","unstructured":"Froud, H., Lachkar, A., & Ouatik, S. A. (2012). A comparative study of root-based and stem-based approaches for measuring similarity between Arabic words for Arabic text mining applications. Advanced Computing: An International Journal (ACIJ), 3(6)."},{"key":"9284_CR12","unstructured":"Green, S., & Manning, C. D. (2010). Better Arabic parsing: Baselines, evaluations, and analysis. In COLING, Beijing (pp. 394\u2013402)."},{"key":"9284_CR13","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-031-02139-8","volume-title":"Introduction to Arabic natural language processing","author":"N Habash","year":"2010","unstructured":"Habash, N. (2010). Introduction to Arabic natural language processing. San Rafael: Morgan & Claypool Publishers."},{"key":"9284_CR14","doi-asserted-by":"crossref","unstructured":"Hagiwara, M. (2008). A supervised learning approach to automatic synonym identification based on distributional features. In Proceedings of the ACL-08, Columbus, June 2008 (pp. 1\u20136).","DOI":"10.3115\/1564154.1564156"},{"key":"9284_CR15","doi-asserted-by":"crossref","unstructured":"Harrag, F., El-Qawasmah, E., & Al-Salman, A. M. (2010). Comparing dimension reduction techniques for Arabic text classification using BPNN algorithm. In IEEE first international conference on integrated intelligent computing, pp. 6\u201311.","DOI":"10.1109\/ICIIC.2010.23"},{"issue":"23","key":"9284_CR16","doi-asserted-by":"crossref","first-page":"146","DOI":"10.1080\/00437956.1954.11659520","volume":"10","author":"Z Harris","year":"1954","unstructured":"Harris, Z. (1954). Distributional structure. Word, 10(23), 146\u2013162.","journal-title":"Word"},{"issue":"2","key":"9284_CR17","first-page":"58","volume":"2","author":"AM Hasnah","year":"2002","unstructured":"Hasnah, A. M., & Al-Ja\u2019am, J. M. (2002). Thesaurus-based query disambiguation method for cross-language information retrieval. International Journal Intelligent Computing and Information Sciences, 2(2), 58\u201368.","journal-title":"International Journal Intelligent Computing and Information Sciences"},{"key":"9284_CR18","unstructured":"Heintz, I. (2010). Arabic language modeling with stem-derived morphemes for automatic speech recognition. Ph.D. thesis, Graduate School of The Ohio State University."},{"issue":"10","key":"9284_CR19","doi-asserted-by":"crossref","first-page":"867","DOI":"10.1002\/(SICI)1097-4571(199710)48:10<867::AID-ASI3>3.0.CO;2-#","volume":"48","author":"I Hmeidi","year":"1997","unstructured":"Hmeidi, I., Kanaan, G., & Evens, M. (1997). Design and implementation of automatic indexing for information retrieval with arabic documents. Journal of the American Society for Information Science, 48(10), 867\u2013881.","journal-title":"Journal of the American Society for Information Science"},{"issue":"4","key":"9284_CR20","doi-asserted-by":"crossref","first-page":"589","DOI":"10.1016\/j.csl.2005.10.001","volume":"20","author":"K Kirchhoff","year":"2006","unstructured":"Kirchhoff, K., Vergyri, D., Duh, K., Bilmes, J., & Stolcke, A. (2006). Morphology-based language modeling for conversational Arabic speech recognition. Computer Speech & Language, 20(4), 589\u2013608.","journal-title":"Computer Speech & Language"},{"key":"9284_CR21","unstructured":"Martins, C. A., Monard, M. C., & Matsubara, E. T. (2003). Reducing the dimensionality of bag-of-words text representation used by learning algorithms. In Proceedings of 3rd IASTED international conference on artificial intelligence and applications (AIA2003), Benalm\u00e1dena, Espanha (pp. 228\u2013233). Calgary: Acta Press."},{"key":"9284_CR22","unstructured":"Mihalcea, R., & Tarau, P. (2004). TextRank: Brining order into texts. In Proceedings of EMNLP 2004. Association for Computational Linguistics, Barcelona, Spain (pp. 404\u2013411)."},{"key":"9284_CR23","volume-title":"Using Arabic synonyms","author":"DB Parkinson","year":"2005","unstructured":"Parkinson, D. B. (2005). Using Arabic synonyms. Cambridge: Cambridge University Press."},{"key":"9284_CR24","unstructured":"Saad, M. K., & Ashour, W. (2010). OSAC: Open Source Arabic Corpus, the 6th International Symposium on Electrical and Electronics Engineering and Computer Science, European University of Lefke, Cyprus, from http:\/\/sourceforge.net\/projects\/ar-text-mining\/files\/ArabicCorpora ."},{"key":"9284_CR25","volume-title":"Introduction to modern information retrieval","author":"G Salton","year":"1986","unstructured":"Salton, G., & McGill, M. J. (1986). Introduction to modern information retrieval. New York, NY: McGraw-Hill. Inc."},{"issue":"11","key":"9284_CR26","doi-asserted-by":"crossref","first-page":"613","DOI":"10.1145\/361219.361220","volume":"18","author":"G Salton","year":"1975","unstructured":"Salton, G., Wong, A., & Yang, C. S. (1975). A vector space model for automatic indexing. Communication of the ACM, 18(11), 613\u2013620.","journal-title":"Communication of the ACM"},{"issue":"2","key":"9284_CR27","doi-asserted-by":"crossref","first-page":"469","DOI":"10.1162\/COLI_a_00178","volume":"40","author":"K Shaalan","year":"2014","unstructured":"Shaalan, K. (2014). A survey of Arabic named entity recognition and classification. Computational Linguistics, 40(2), 469\u2013510. doi: 10.1162\/COLIa00178 .","journal-title":"Computational Linguistics"},{"key":"9284_CR28","doi-asserted-by":"crossref","first-page":"141","DOI":"10.1613\/jair.2934","volume":"37","author":"PD Turney","year":"2010","unstructured":"Turney, P. D., & Pantel, P. (2010). From frequency to meaning: Vector space models of semantics. Journal of Artificial Intelligence Research, 37, 141\u2013188.","journal-title":"Journal of Artificial Intelligence Research"},{"key":"9284_CR29","volume-title":"Information retrieval","author":"CJ Rijsbergen Van","year":"1979","unstructured":"Van Rijsbergen, C. J. (1979). Information retrieval (2nd ed.). Cambridge: Computer Laboratory, University of Cambridge.","edition":"2"},{"key":"9284_CR30","doi-asserted-by":"crossref","unstructured":"Xu, J., Fraser, A., & Weischedel, R. (2002). Empirical studies in strategies for Arabic retrieval. In SIGIR\u201902, Proceedings of the 25th annual international ACMSIGIR conference on Research and development in information retrieval, Tampere, Finland (pp. 269\u2013274). August 11\u201315, 2002.","DOI":"10.1145\/564376.564424"}],"container-title":["International Journal of Speech Technology"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-015-9284-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10772-015-9284-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-015-9284-6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,11]],"date-time":"2023-08-11T07:03:55Z","timestamp":1691737435000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10772-015-9284-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,6,9]]},"references-count":30,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2016,6]]}},"alternative-id":["9284"],"URL":"https:\/\/doi.org\/10.1007\/s10772-015-9284-6","relation":{},"ISSN":["1381-2416","1572-8110"],"issn-type":[{"type":"print","value":"1381-2416"},{"type":"electronic","value":"1572-8110"}],"subject":[],"published":{"date-parts":[[2015,6,9]]}}}