{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T19:36:52Z","timestamp":1772048212293,"version":"3.50.1"},"reference-count":103,"publisher":"Springer Science and Business Media LLC","issue":"8","license":[{"start":{"date-parts":[[2020,4,15]],"date-time":"2020-04-15T00:00:00Z","timestamp":1586908800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,4,15]],"date-time":"2020-04-15T00:00:00Z","timestamp":1586908800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/100007713","name":"Bahauddin Zakariya University","doi-asserted-by":"crossref","award":["2019-05"],"award-info":[{"award-number":["2019-05"]}],"id":[{"id":"10.13039\/100007713","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Artif Intell Rev"],"published-print":{"date-parts":[[2020,12]]},"DOI":"10.1007\/s10462-020-09828-3","type":"journal-article","created":{"date-parts":[[2020,4,15]],"date-time":"2020-04-15T13:03:42Z","timestamp":1586955822000},"page":"5559-5588","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":41,"title":["Empirical evaluation and study of text stemming algorithms"],"prefix":"10.1007","volume":"53","author":[{"given":"Abdul","family":"Jabbar","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8464-2275","authenticated-orcid":false,"given":"Sajid","family":"Iqbal","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Manzoor Ilahi","family":"Tamimy","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shafiq","family":"Hussain","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Adnan","family":"Akhunzada","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2020,4,15]]},"reference":[{"issue":"4","key":"9828_CR1","first-page":"368","volume":"9","author":"M Ababneh","year":"2012","unstructured":"Ababneh M, Al-Shalabi R, Kanaan G, Al-Nobani A (2012) Building an effective rule-based light stemmer for arabic language to improve search effectiveness. Int Arab J Inf Technol 9(4):368\u2013372","journal-title":"Int Arab J Inf Technol"},{"issue":"3","key":"9828_CR2","doi-asserted-by":"crossref","first-page":"557","DOI":"10.1080\/0952813X.2016.1212100","volume":"29","author":"K Abainia","year":"2017","unstructured":"Abainia K, Ouamour S, Sayoud H (2017) A novel robust Arabic light stemmer. J Exp Theor Artif Intell 29(3):557\u2013573","journal-title":"J Exp Theor Artif Intell"},{"issue":"2","key":"9828_CR3","first-page":"128","volume":"11","author":"A Abu-Errub","year":"2014","unstructured":"Abu-Errub A, Odeh A, Shambour Q, Hassan OAH (2014) Arabic roots extraction using morphological analysis. Int J Comput Sci Issues (IJCSI) 11(2):128","journal-title":"Int J Comput Sci Issues (IJCSI)"},{"key":"9828_CR4","doi-asserted-by":"crossref","first-page":"7374","DOI":"10.1109\/ACCESS.2017.2787798","volume":"6","author":"M Ali","year":"2018","unstructured":"Ali M, Khalid S, Aslam MH (2018) Pattern-based comprehensive Urdu stemmer and short text classification. IEEE Access 6:7374\u20137389","journal-title":"IEEE Access"},{"issue":"1","key":"9828_CR5","first-page":"138","volume":"16","author":"M Ali","year":"2019","unstructured":"Ali M, Khalid S, Saleemi M (2019) Comprehensive stemmer for morphologically rich urdu language. Int Arab J Inf Technol 16(1):138\u2013147","journal-title":"Int Arab J Inf Technol"},{"key":"9828_CR6","doi-asserted-by":"crossref","first-page":"291","DOI":"10.1016\/j.cogsys.2018.07.003","volume":"52","author":"FS Alotaibi","year":"2018","unstructured":"Alotaibi FS, Gupta V (2018) A cognitive inspired unsupervised language-independent text stemmer for Information retrieval. Cognit Syst Res 52:291\u2013300","journal-title":"Cognit Syst Res"},{"issue":"2","key":"9828_CR7","first-page":"94","volume":"27","author":"MN Al-Kabi","year":"2015","unstructured":"Al-Kabi MN, Kazakzeh SA, Ata BMA, Al-Rababah SA, Alsmadi IM (2015) A novel root based Arabic stemmer. J King Saud Univ-Comput Inf Sci 27(2):94\u2013103","journal-title":"J King Saud Univ-Comput Inf Sci"},{"issue":"6","key":"9828_CR8","first-page":"702","volume":"9","author":"A Al-Omari","year":"2014","unstructured":"Al-Omari A, Abuata B (2014) Arabic light stemmer (ARS). J Eng Sci Technol 9(6):702\u2013717","journal-title":"J Eng Sci Technol"},{"key":"9828_CR9","doi-asserted-by":"crossref","unstructured":"AlSerhan HM, Alqrainy S, Ayesh A (2008, November). Is paice method suitable for evaluating Arabic stemming algorithms? In: International conference on computer engineering & systems, 2008 (ICCES 2008). IEEE, pp 131\u2013135","DOI":"10.1109\/ICCES.2008.4772981"},{"key":"9828_CR10","doi-asserted-by":"crossref","unstructured":"Al-Shammari ET, Lin J. (2008, October). Towards an error-free Arabic stemming. In Proceedings of the 2nd ACM workshop on Improving non English web searching. ACM, pp 9\u201316","DOI":"10.1145\/1460027.1460030"},{"issue":"3","key":"9828_CR100","doi-asserted-by":"crossref","first-page":"189","DOI":"10.1002\/asi.10368","volume":"55","author":"IA Al-Sughaiyer","year":"2004","unstructured":"Al-Sughaiyer IA, Al-Kharashi IA (2004) Arabic morphological analysis techniques: A comprehensive survey. J American Soc Inf Sci Tech 55(3):189\u2013213","journal-title":"J American Soc Inf Sci Tech"},{"key":"9828_CR11","first-page":"693","volume-title":"Portuguese conference on artificial intelligence","author":"RV Alvares","year":"2005","unstructured":"Alvares RV, Garcia AC, Ferraz I (2005) December) STEMBR: a stemming algorithm for the Brazilian Portuguese language. Portuguese conference on artificial intelligence. Springer, Berlin, pp 693\u2013701"},{"key":"9828_CR96","unstructured":"Aronoff M, Fudeman K (2011) What is morphology? vol. 8.\nWiley, pp 2\u20133"},{"issue":"3","key":"9828_CR12","doi-asserted-by":"crossref","first-page":"687","DOI":"10.1007\/s10579-015-9311-x","volume":"50","author":"A Bimba","year":"2016","unstructured":"Bimba A, Idris N, Khamis N, Noor NF (2016) Stemming Hausa text: using affix-stripping rules and reference look-up. Lang Resour Eval 50(3):687\u2013703","journal-title":"Lang Resour Eval"},{"key":"9828_CR13","doi-asserted-by":"publisher","unstructured":"B\u00f6l\u00fcc\u00fc, Necva and Burcu Can. (2019). Unsupervised Joint PoS Tagging and Stemming for Agglutinative Languages. ACM Trans. Asian Low-Resour. Lang. Inf. Process. 18, 3, Article 25 (January 2019), 21 pages. https:\/\/doi.org\/10.1145\/3292398","DOI":"10.1145\/3292398"},{"key":"9828_CR14","doi-asserted-by":"crossref","unstructured":"Boudchiche M, Mazroui A (2015, December). Evaluation of the ambiguity caused by the absence of diacritical marks in Arabic texts: statistical study. In: 2015 5th international conference on information and communication technology and accessibility (ICTA). IEEE, pp 1\u20136","DOI":"10.1109\/ICTA.2015.7426904"},{"key":"9828_CR15","doi-asserted-by":"crossref","unstructured":"Boukhalfa I, Mostefai S, Chekkai N (2018, March) A study of graph based stemmer in Arabic extrinsic plagiarism detection. In: Proceedings of the 2nd mediterranean conference on pattern recognition and artificial intelligence. ACM, pp 27\u201332","DOI":"10.1145\/3177148.3180089"},{"issue":"1","key":"9828_CR16","doi-asserted-by":"crossref","first-page":"68","DOI":"10.1016\/j.ipm.2014.08.006","volume":"51","author":"T Brychc\u00edn","year":"2015","unstructured":"Brychc\u00edn T, Konop\u00edk M (2015) HPS: high precision stemmer. Inf Process Manag 51(1):68\u201391","journal-title":"Inf Process Manag"},{"key":"9828_CR17","unstructured":"Buckley C (1985) Implementation of the smart information retrieval system. Technical report 85\u2013686, Cornell University."},{"issue":"2","key":"9828_CR18","doi-asserted-by":"crossref","first-page":"48","DOI":"10.1109\/MCI.2014.2307227","volume":"9","author":"E Cambria","year":"2014","unstructured":"Cambria E, White B (2014) Jumping NLP curves: a review of natural language processing research. IEEE Comput Intell Mag 9(2):48\u201357","journal-title":"IEEE Comput Intell Mag"},{"issue":"7","key":"9828_CR19","first-page":"1148","volume":"3","author":"DR Chintala","year":"2013","unstructured":"Chintala DR, Reddy EM (2013) An approach to enhance the CPI using Porter stemming algorithm. Int J Adv Res Comput Sci Softw Eng 3(7):1148\u20131156","journal-title":"Int J Adv Res Comput Sci Softw Eng"},{"key":"9828_CR20","unstructured":"CISI Collection https:\/\/ir.dcs.gla.ac.uk\/resources\/test_collections\/cisi\/. Accessed 30 Dec 2019. Developed by University of Glasgow"},{"issue":"8","key":"9828_CR21","first-page":"38","volume":"125","author":"MY Dahab","year":"2015","unstructured":"Dahab MY, Ibrahim A, Al-Mutawa R (2015) A comparative study on Arabic stemmers. Int J Comput Appl 125(8):38\u201347","journal-title":"Int J Comput Appl"},{"key":"9828_CR22","doi-asserted-by":"crossref","unstructured":"Dang Q, Zhang J, Lu Y, Zhang K (2013) WordNet-based suffix tree clustering algorithm. In: International conference on information science and computer applications (ISCA 2013)","DOI":"10.2991\/isca-13.2013.12"},{"key":"9828_CR23","first-page":"21","volume":"3","author":"A Dey","year":"2014","unstructured":"Dey A, Paul A, Purkayastha BS (2014) Named entity recognition for Nepali language: a semi hybrid approach. Int J Eng Innov Technol (IJEIT) 3:21\u201325","journal-title":"Int J Eng Innov Technol (IJEIT)"},{"issue":"2","key":"9828_CR102","first-page":"89","volume":"3","author":"MH Dianati","year":"2014","unstructured":"Dianati MH, Sadreddini MH, Hossein RA, Fakhrahmad SM, Taghi-Zadeh H (2014) Words stemming based on structural and semantic similarity. Comp Eng Appl J 3(2):89\u201399","journal-title":"Comp Eng Appl J"},{"issue":"2","key":"9828_CR24","doi-asserted-by":"crossref","first-page":"28","DOI":"10.3390\/info9020028","volume":"9","author":"RAN de Oliveira","year":"2018","unstructured":"de Oliveira RAN, Junior MC (2018) Experimental analysis of stemming on jurisprudential documents retrieval. Information 9(2):28","journal-title":"Information"},{"key":"9828_CR25","unstructured":"Dukes K, Habash N (2010) Morphological annotation of Quranic Arabic. In Lrec, pp 2530\u20132536"},{"issue":"8","key":"9828_CR26","doi-asserted-by":"crossref","first-page":"2883","DOI":"10.1007\/s13369-016-2029-2","volume":"41","author":"M El-Defrawy","year":"2016","unstructured":"El-Defrawy M, El-Sonbaty Y, Belal NA (2016) A rule-based subject-correlated Arabic stemmer. Arab J Sci Eng 41(8):2883\u20132891","journal-title":"Arab J Sci Eng"},{"issue":"4","key":"9828_CR27","doi-asserted-by":"crossref","first-page":"1003","DOI":"10.1016\/j.ipm.2005.07.002","volume":"42","author":"MA Fattah","year":"2006","unstructured":"Fattah MA, Ren F, Kuroiwa S (2006) Stemming to improve translation lexicon creation form bitexts. Inf Process Manag 42(4):1003\u20131016","journal-title":"Inf Process Manag"},{"issue":"5","key":"9828_CR28","doi-asserted-by":"crossref","first-page":"840","DOI":"10.1016\/j.ipm.2016.03.004","volume":"52","author":"FN Flores","year":"2016","unstructured":"Flores FN, Moreira VP (2016) Assessing the impact of stemming accuracy on information retrieval\u2013a multilingual perspective. Inf Process Manag 52(5):840\u2013854","journal-title":"Inf Process Manag"},{"key":"9828_CR29","unstructured":"Frakes WB, Fox CJ (2003) Strength and similarity of affix removal stemming algorithms. In ACM SIGIR forum, vol 37, no 1. ACM, pp 26\u201330."},{"issue":"2","key":"9828_CR30","first-page":"1","volume":"3","author":"MS Gaidhane","year":"2015","unstructured":"Gaidhane MS, Gondhale MD, Talole MP (2015) A comparative study of stemming algorithms for natural language processing. J Eng Educ Technol (ARDIJEET) 3(2):1\u20136","journal-title":"J Eng Educ Technol (ARDIJEET)"},{"issue":"2","key":"9828_CR31","doi-asserted-by":"crossref","first-page":"28","DOI":"10.1145\/2938640","volume":"49","author":"A Giachanou","year":"2016","unstructured":"Giachanou A, Crestani F (2016) Like it or not: a survey of twitter sentiment analysis methods. ACM Comput Surv (CSUR) 49(2):28","journal-title":"ACM Comput Surv (CSUR)"},{"issue":"1","key":"9828_CR32","doi-asserted-by":"crossref","first-page":"7","DOI":"10.1002\/(SICI)1097-4571(199101)42:1<7::AID-ASI2>3.0.CO;2-P","volume":"42","author":"D Harman","year":"1991","unstructured":"Harman D (1991) How effective is suffixing. J Am Soc Inf Sci 42(1):7\u201315","journal-title":"J Am Soc Inf Sci"},{"issue":"1","key":"9828_CR33","doi-asserted-by":"crossref","first-page":"17","DOI":"10.1145\/2932710","volume":"49","author":"K Hassani","year":"2016","unstructured":"Hassani K, Lee WS (2016) Visualizing natural language descriptions: a survey. ACM Comput Surv (CSUR) 49(1):17","journal-title":"ACM Comput Surv (CSUR)"},{"key":"9828_CR34","doi-asserted-by":"crossref","first-page":"45","DOI":"10.1007\/978-3-642-31600-5_5","volume-title":"Advances in computing and information technology","author":"MS Husain","year":"2013","unstructured":"Husain MS, Ahamad F, Khalid S (2013) A language independent approach to develop Urdu stemmer. Advances in computing and information technology. Springer, Berlin, pp 45\u201353"},{"key":"9828_CR35","doi-asserted-by":"crossref","first-page":"70","DOI":"10.1002\/(SICI)1097-4571(199601)47:1<70::AID-ASI7>3.0.CO;2-#","volume":"47","author":"DA Hull","year":"1996","unstructured":"Hull DA (1996) Stemming algorithms\u2014a case study for detailed evaluation. J Am Soc Inf Sci 47:70\u201384","journal-title":"J Am Soc Inf Sci"},{"issue":"15","key":"9828_CR36","first-page":"3560","volume":"95","author":"Z Hussain","year":"2017","unstructured":"Hussain Z, Iqbal S, Saba T, Almazyad AS, Rehman A (2017) Design and development of dictionary-based stemmer for the urdu language. J Theor Appl Inf Technol 95(15):3560\u20133569","journal-title":"J Theor Appl Inf Technol"},{"key":"9828_CR37","unstructured":"Islam Md, Uddin Md, Khan M (2007) A light weight stemmer for Bengali and its use in spelling checker. Retrieved 24 March, 2019, from http:\/\/hdl.handle.net\/10361\/328"},{"key":"9828_CR38","doi-asserted-by":"crossref","unstructured":"Ismailov A, Jalil MA, Abdullah Z, Rahim NA (2016) A comparative study of stemming algorithms for use with the Uzbek language. In: 3rd international conference on computer and information sciences (ICCOINS), 2016. IEEE, pp 7\u201312","DOI":"10.1109\/ICCOINS.2016.7783180"},{"issue":"2","key":"9828_CR39","first-page":"164","volume":"29","author":"Y Jaafar","year":"2017","unstructured":"Jaafar Y, Namly D, Bouzoubaa K, Yousfi A (2017) Enhancing Arabic stemming process using resources and benchmarking tools. J King Saud Univ-Comput Inf Sci 29(2):164\u2013170","journal-title":"J King Saud Univ-Comput Inf Sci"},{"key":"9828_CR40","unstructured":"Jabbar A, Iqbal S, Khan MUG (2016a) Analysis and development of resources for Urdu text stemming. In: Proceedings of the 6th annual international conference on language and technology, KICS-CLE, UET Lahore"},{"key":"9828_CR41","doi-asserted-by":"publisher","DOI":"10.1080\/0952813X.2018.1467495","author":"A Jabbar","year":"2018","unstructured":"Jabbar A, Iqbal S, Akhunzada A, Abbas Q (2018a) An improved Urdu stemming algorithm for text mining based on multi-step hybrid approach. J Exp Theor Artif Intell. https:\/\/doi.org\/10.1080\/0952813X.2018.1467495","journal-title":"J Exp Theor Artif Intell"},{"issue":"3","key":"9828_CR42","doi-asserted-by":"crossref","first-page":"339","DOI":"10.1007\/s10462-016-9527-1","volume":"49","author":"A Jabbar","year":"2018","unstructured":"Jabbar A, Iqbal S, Khan MUG, Hussain S (2018b) A survey on Urdu and Urdu like language stemmers and stemming techniques. Artif Intell Rev 49(3):339\u2013373","journal-title":"Artif Intell Rev"},{"issue":"3","key":"9828_CR43","doi-asserted-by":"crossref","first-page":"339","DOI":"10.1007\/s10462-016-9527-1","volume":"49","author":"A Jabbar","year":"2018","unstructured":"Jabbar A, Iqbal S, Khan MUG, Hussain S (2018b) A survey on Urdu and Urdu like language stemmers and stemming techniques. Artif Intell Rev 49(3):339\u2013373","journal-title":"Artif Intell Rev"},{"issue":"6","key":"9828_CR99","first-page":"1930","volume":"2","author":"AG Jivani","year":"2011","unstructured":"Jivani AG (2011) A comparative study of stemming algorithms. Int J Comp Tech Appl 2(6):1930\u20131938","journal-title":"Int J Comp Tech Appl"},{"issue":"4","key":"9828_CR44","first-page":"143","volume":"5","author":"WBA Karaa","year":"2013","unstructured":"Karaa WBA (2013) A new stemmer to improve information retrieval. Int J Netw Secur Appl 5(4):143","journal-title":"Int J Netw Secur Appl"},{"issue":"4","key":"9828_CR45","doi-asserted-by":"crossref","first-page":"56","DOI":"10.1145\/2719920","volume":"47","author":"S Karimi","year":"2015","unstructured":"Karimi S, Wang C, Metke-Jimenez A, Gaire R, Paris C (2015) Text and data mining techniques in adverse drug reaction detection. ACM Comput Surv (CSUR) 47(4):56","journal-title":"ACM Comput Surv (CSUR)"},{"issue":"2","key":"9828_CR46","doi-asserted-by":"crossref","first-page":"571","DOI":"10.1007\/s11049-018-9419-y","volume":"37","author":"I Kastner","year":"2019","unstructured":"Kastner I (2019) Templatic morphology as an emergent property. Nat Lang Linguist Theory 37(2):571\u2013619","journal-title":"Nat Lang Linguist Theory"},{"issue":"7","key":"9828_CR47","first-page":"407","volume":"1","author":"A Khalid","year":"2016","unstructured":"Khalid A, Hussain Z, Baig MA (2016) Arabic stemmer for search engines information retrieval. Int J Adv Comput Sci Appl 1(7):407\u2013411","journal-title":"Int J Adv Comput Sci Appl"},{"key":"9828_CR1001","unstructured":"Khan S, Waqas A, Usama B, Xuan W (2015) Template based affix stemmer for a morphologically rich language. Int Arab J Inf Tech 12(2):146\u2013154"},{"key":"9828_CR48","volume-title":"Stemming arabic text","author":"S Khoja","year":"1999","unstructured":"Khoja S, Garside R (1999) Stemming arabic text. Lancaster University, Lancaster, UK, Computing Department"},{"issue":"1\u20132","key":"9828_CR49","doi-asserted-by":"crossref","first-page":"277","DOI":"10.1016\/S0004-3702(99)00101-0","volume":"118","author":"R Krovetz","year":"2000","unstructured":"Krovetz R (2000) Viewing morphology as an inference process. Artif intel 118(1\u20132):277\u2013294","journal-title":"Artif intel"},{"key":"9828_CR50","doi-asserted-by":"crossref","first-page":"221","DOI":"10.1007\/978-1-4020-6046-5_12","volume-title":"Arabic computational morphology","author":"LS Larkey","year":"2007","unstructured":"Larkey LS, Ballesteros L, Connell ME (2007) Light stemming for Arabic information retrieval. Arabic computational morphology. Springer, Dordrecht, pp 221\u2013243"},{"key":"9828_CR51","unstructured":"Lemur (2016) https:\/\/www.lemurproject.org. Accessed 14 Aug 2018"},{"issue":"4","key":"9828_CR52","doi-asserted-by":"crossref","first-page":"177","DOI":"10.1177\/016555158100300403","volume":"3","author":"M Lennon","year":"1981","unstructured":"Lennon M, Peirce DS, Tarry BD, Willett P (1981) An evaluation of some conflation algorithms for information retrieval. Inf Sci 3(4):177\u2013183","journal-title":"Inf Sci"},{"issue":"1\u20132","key":"9828_CR53","first-page":"22","volume":"11","author":"JB Lovins","year":"1968","unstructured":"Lovins JB (1968) Development of a stemming algorithm. Mech Transl Comput Linguist 11(1\u20132):22\u201331","journal-title":"Mech Transl Comput Linguist"},{"key":"9828_CR54","unstructured":"Lucene (2018) https:\/\/lucene.apache.org. Accessed 12 Aug 2018"},{"issue":"8","key":"9828_CR55","first-page":"90","volume":"17","author":"A Mateen","year":"2017","unstructured":"Mateen A, Malik MK, Nawaz Z, Danish HM, Siddiqui MH, Abbas Q (2017) A hybrid stemmer of punjabi shahmukhi script. Int J Comput Sci Netw Secur 17(8):90\u201397","journal-title":"Int J Comput Sci Netw Secur"},{"key":"9828_CR56","unstructured":"McCormick C (2016) Word2Vec tutorial\u2014the skip-gram model. https:\/\/www.mccormickml.com"},{"issue":"5","key":"9828_CR57","first-page":"711","volume":"4","author":"U Mishra","year":"2012","unstructured":"Mishra U, Prakash C (2012) MAULIK: an effective stemmer for Hindi language. Int J Comput Sci Eng 4(5):711\u2013717","journal-title":"Int J Comput Sci Eng"},{"issue":"2","key":"9828_CR58","doi-asserted-by":"crossref","first-page":"291","DOI":"10.1016\/S0346-251X(00)00013-0","volume":"28","author":"M Mochizuki","year":"2000","unstructured":"Mochizuki M, Aizawa K (2000) An affix acquisition order for EFL learners: an exploratory study. System 28(2):291\u2013304","journal-title":"System"},{"issue":"3","key":"9828_CR98","first-page":"450","volume":"11","author":"FM Moghadam","year":"2015","unstructured":"Moghadam FM, MohammadReza K  (2015) Comparative study of various Persian stemmers in the field of information retrieval. J Inf Proc Syst 11(3):450\u2013464","journal-title":"J inf proc syst"},{"key":"9828_CR59","unstructured":"Momenipour F, Keyvanpour MR (2016) PHMM: stemming on Persian texts using statistical stemmer based on hidden Markov Model. Int J Inf Sci Manag 14(2):107\u2013117"},{"issue":"1","key":"9828_CR60","doi-asserted-by":"crossref","first-page":"15","DOI":"10.1177\/0165551516683617","volume":"44","author":"AM Mustafa","year":"2018","unstructured":"Mustafa AM, Rashid TA (2018) Kurdish stemmer pre-processing steps for improving information retrieval. J Inf Sci 44(1):15\u201327","journal-title":"J Inf Sci"},{"key":"9828_CR61","first-page":"90","volume-title":"International conference on application of natural language to information systems","author":"DT Nguyen","year":"2013","unstructured":"Nguyen, (2013) Nguyen DT, Leveling J (2013) Exploring domain-sensitive features for extractive summarization in the medical domain. International conference on application of natural language to information systems. Springer, Berlin, pp 90\u2013101"},{"key":"9828_CR101","unstructured":"Nwesri AFA, Alyagoubi HAH (2015). Applying arabic stemming using query expansion. In 2015 26th international workshop on database and expert systems applications (DEXA) (pp. 299\u2013303). IEEE"},{"key":"9828_CR62","unstructured":"Orengo VM, Huyck C (2001) a stemming algorithm for the portuguese language. In; SPIRE '01: Proceedings of eigth symposium on string processing and information retrieval, pp 186\u2013193."},{"issue":"3","key":"9828_CR63","doi-asserted-by":"crossref","first-page":"56","DOI":"10.1145\/101306.101310","volume":"24","author":"CD Paice","year":"1990","unstructured":"Paice CD (1990) Another stemmer. SIGIR Forum 24(3):56\u201361","journal-title":"SIGIR Forum"},{"issue":"8","key":"9828_CR64","doi-asserted-by":"crossref","first-page":"632","DOI":"10.1002\/(SICI)1097-4571(199608)47:8<632::AID-ASI8>3.0.CO;2-U","volume":"47","author":"CD Paice","year":"1996","unstructured":"Paice CD (1996) Method for evaluation of stemming algorithms based on error counting. J Am Soc Inf Sci 47(8):632\u2013649","journal-title":"J Am Soc Inf Sci"},{"key":"9828_CR65","doi-asserted-by":"crossref","unstructured":"Paice CD (1994) An evaluation method for stemming algorithms. In: Proceedings of the 17th annual international ACM SIGIR conference on research and development in information retrieval. Springer, New York, pp 42\u201350","DOI":"10.1007\/978-1-4471-2099-5_5"},{"key":"9828_CR66","doi-asserted-by":"publisher","DOI":"10.1093\/llc\/fqy053","author":"BP Pande","year":"2018","unstructured":"Pande BP, Tamta P, Dhami HS (2018) Generation, implementation and appraisal of an N-gram based stemming algorithm. Digit Scholarsh Humanit. https:\/\/doi.org\/10.1093\/llc\/fqy053","journal-title":"Digit Scholarsh Humanit"},{"key":"9828_CR67","doi-asserted-by":"crossref","unstructured":"Paik JH, Pal D, Parui SK (2011) A novel corpus-based stemming algorithm using co-occurrence statistics. In: Proceedings of the 34th annual international ACM SIGIR conference on research and development in information retrieval (SIGIR\u201911). ACM, New York, pp 863\u2013872","DOI":"10.1145\/2009916.2010031"},{"issue":"7","key":"9828_CR68","first-page":"9","volume":"2","author":"CG Patil","year":"2013","unstructured":"Patil CG, Patil SS (2013) Use of Porter stemming algorithm and SVM for emotion extraction from news headlines. Int J Electron Commun Soft Comput Sci Eng 2(7):9\u201313","journal-title":"Int J Electron Commun Soft Comput Sci Eng"},{"key":"9828_CR69","unstructured":"Porter MF (2006) https:\/\/snowball.artarus.org\/algorithms\/english\/ stemmer.html"},{"issue":"3","key":"9828_CR70","doi-asserted-by":"crossref","first-page":"130","DOI":"10.1108\/eb046814","volume":"14","author":"MF Porter","year":"1980","unstructured":"Porter MF (1980) An algorithm for suffix stripping. Program 14(3):130\u2013137","journal-title":"Program"},{"issue":"2","key":"9828_CR97","first-page":"96","volume":"23","author":"AH Qureshi","year":"2018","unstructured":"Qureshi AH, Hassan MU, Akhter S (2018) Towards description of derivation in Urdu: morphological perspective. Al-Qalam 23(2):96\u2013100","journal-title":"Al-Qalam"},{"issue":"3","key":"9828_CR71","first-page":"165","volume":"4","author":"SPR Rani","year":"2015","unstructured":"Rani SPR, Ramesh B, Anusha M, Rani SJGR (2015) Evaluation of stemming techniques for text classification. Int J Comput Sci Mobile Comput 4(3):165\u2013171","journal-title":"Int J Comput Sci Mobile Comput"},{"key":"9828_CR72","doi-asserted-by":"crossref","first-page":"358","DOI":"10.1007\/978-981-10-2738-3_31","volume-title":"International symposium on security in computing and communication","author":"TA Rashid","year":"2016","unstructured":"Rashid TA, Mohamad SO (2016) Enhancement of detecting wicked website through intelligent methods. International symposium on security in computing and communication. Springer, Singapore, pp 358\u2013368"},{"key":"9828_CR73","doi-asserted-by":"crossref","unstructured":"Rashidi A, Lighvan MZ (2014) HPS: a hierarchical Persian stemming method. arXiv preprint arXiv:1403.2837.","DOI":"10.5121\/ijnlc.2014.3102"},{"issue":"8","key":"9828_CR74","doi-asserted-by":"crossref","first-page":"e68178","DOI":"10.1371\/journal.pone.0068178","volume":"8","author":"Z Rehman","year":"2013","unstructured":"Rehman Z, Anwar W, Bajwa UI, Xuan W, Chaoying Z (2013) Morpheme matching based text tokenization for a scarce resourced language. PLoS ONE 8(8):e68178","journal-title":"PLoS ONE"},{"key":"9828_CR75","first-page":"19","volume":"18","author":"MK Saad","year":"2010","unstructured":"Saad MK, Ashour W (2010) Arabic morphological tools for text mining. Corpora 18:19","journal-title":"Corpora"},{"issue":"2","key":"9828_CR76","doi-asserted-by":"crossref","first-page":"99","DOI":"10.1007\/s42044-018-0007-4","volume":"1","author":"AM Saeed","year":"2018","unstructured":"Saeed AM, Rashid TA, Mustafa AM, Al-Rashid Agha RA, Shamsaldin AS, Al-Salihi NK (2018a) An evaluation of Reber stemmer with longest match stemmer technique in Kurdish Sorani text classification. Iran J Comput Sci 1(2):99\u2013107","journal-title":"Iran J Comput Sci"},{"issue":"1","key":"9828_CR77","doi-asserted-by":"crossref","first-page":"48","DOI":"10.25079\/ukhjse.v2n1y2018.pp48-54","volume":"2","author":"AM Saeed","year":"2018","unstructured":"Saeed AM, Rashid TA, Mustafa AM, Fattah P, Ismael B (2018b) Improving Kurdish web mining through tree data structure and Porter\u2019s Stemmer algorithms. UKH J Sci Eng 2(1):48\u201354","journal-title":"UKH J Sci Eng"},{"issue":"9","key":"9828_CR78","first-page":"213","volume":"4","author":"B Sarma","year":"2013","unstructured":"Sarma B, Purkayastha BS (2013) An affix based word classification method of assamese text. Int J Adv Res Comput Sci 4(9):213\u2013216","journal-title":"Int J Adv Res Comput Sci"},{"key":"9828_CR79","doi-asserted-by":"crossref","first-page":"287","DOI":"10.1162\/tacl_a_00099","volume":"4","author":"A Schofield","year":"2016","unstructured":"Schofield A, Mimno D (2016) Comparing apples to apple: the effects of stemmers on topic models. Trans Assoc Comput Linguist 4:287\u2013300","journal-title":"Trans Assoc Comput Linguist"},{"key":"9828_CR80","doi-asserted-by":"crossref","unstructured":"Setiawan R, Kurniawan A, Budiharto W, Kartowisastro IH, Prabowo H (2016) Flexible affix classification for stemming Indonesian Language. In: 2016 13th international conference on electrical engineering\/electronics, computer, telecommunications and information technology (ECTI-CON). IEEE, pp 1\u20136","DOI":"10.1109\/ECTICon.2016.7561257"},{"issue":"3","key":"9828_CR81","doi-asserted-by":"crossref","first-page":"45","DOI":"10.1145\/2975608","volume":"49","author":"J Singh","year":"2016","unstructured":"Singh J, Gupta V (2016) Text stemming: approaches, applications, and challenges. ACM Comput Surv (CSUR) 49(3):45","journal-title":"ACM Comput Surv (CSUR)"},{"issue":"5","key":"9828_CR82","doi-asserted-by":"crossref","first-page":"671","DOI":"10.1007\/s12559-017-9479-z","volume":"9","author":"J Singh","year":"2017","unstructured":"Singh J, Gupta V (2017) An efficient corpus-based stemmer. Cognit Comput 9(5):671\u2013688","journal-title":"Cognit Comput"},{"issue":"2","key":"9828_CR83","first-page":"265","volume":"4","author":"SR Sirsat","year":"2013","unstructured":"Sirsat SR, Chavan V, Mahalle HS (2013) Strength and accuracy analysis of affix removal stemming algorithms. Int J Comput Sci Inf Technol 4(2):265\u2013269","journal-title":"Int J Comput Sci Inf Technol"},{"issue":"2","key":"9828_CR84","first-page":"6","volume":"13","author":"S Sulaiman","year":"2014","unstructured":"Sulaiman S, Omar K, Omar N, Murah MZ, Abdul Rahman HD (2014) The effectiveness of a Jawi stemmer for retrieving relevant Malay documents in Jawi characters. ACM Trans Asian Lang Inf Process (TALIP) 13(2):6","journal-title":"ACM Trans Asian Lang Inf Process (TALIP)"},{"issue":"4","key":"9828_CR85","first-page":"27","volume":"17","author":"AA Suryani","year":"2018","unstructured":"Suryani AA, Widyantoro DW, Purwarianti A, Sudaryat Y (2018) The rule-based sundanese stemmer. ACM Trans Asian Low-Resour Lang Inf Process (TALLIP) 17(4):27","journal-title":"ACM Trans Asian Low-Resour Lang Inf Process (TALLIP)"},{"issue":"1","key":"9828_CR86","first-page":"209","volume":"32","author":"H Taghi-Zadeh","year":"2015","unstructured":"Taghi-Zadeh H, Sadreddini MH, Diyanati MH, Rasekh AH (2015) A new hybrid stemming method for persian language. Digit Scholarsh Humanit 32(1):209\u2013221","journal-title":"Digit Scholarsh Humanit"},{"issue":"7","key":"9828_CR87","first-page":"812","volume":"3","author":"M Thangarasu","year":"2013","unstructured":"Thangarasu M, Manavalan R (2013) Design and development of stemmer for Tamil language: cluster analysis. Int J Adv Res Comput Sci Softw Eng 3(7):812\u2013818","journal-title":"Int J Adv Res Comput Sci Softw Eng"},{"key":"9828_CR88","unstructured":"The free dictionary (2018) https:\/\/www.thefreedictionary.com\/. Accessed 03 Aug 2018"},{"key":"9828_CR89","doi-asserted-by":"crossref","unstructured":"Qunis I, Amati G, Plachouras V, He B, Macdonald C, Lioma C (2006) A high performance and scalable information retrieval plateform. In: SIGR workshop on open source information retrieval","DOI":"10.1007\/978-3-540-31865-1_37"},{"key":"9828_CR90","unstructured":"Urdu L (2006) https:\/\/182.180.102.251:8081\/oud\/help_3.htm. Accessed 04 Aug 2018"},{"key":"9828_CR91","unstructured":"Xapian (2018) https:\/\/xapian.org. Accessed 07 Aug 2018"},{"key":"9828_CR92","unstructured":"Xer (1994) Xeror linguistic database reference, English version 1.1.4 ed.s"},{"issue":"2","key":"9828_CR93","doi-asserted-by":"crossref","first-page":"25","DOI":"10.1145\/3057270","volume":"50","author":"A Yadollahi","year":"2017","unstructured":"Yadollahi A, Shahraki AG, Zaiane OR (2017) Current state of text sentiment analysis from opinion to emotion mining. ACM Comput Surv (CSUR) 50(2):25","journal-title":"ACM Comput Surv (CSUR)"},{"key":"9828_CR94","unstructured":"Zerrouki T (2016) Tashaphyne 0.2 (Online). https:\/\/pypi.python.org\/pypi\/Tashaphyne. Accessed 14 Apr 2016"},{"issue":"1","key":"9828_CR95","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/2379776.2379777","volume":"45","author":"D Zhou","year":"2012","unstructured":"Zhou D, Mark T, Brailsford T, Wade V, Ashman H (2012) Translation techniques in cross-language information retrieval. ACM Comput Surv (CSUR) 45(1):1","journal-title":"ACM Comput Surv (CSUR)"}],"container-title":["Artificial Intelligence Review"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-020-09828-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10462-020-09828-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-020-09828-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,4,15]],"date-time":"2021-04-15T08:20:39Z","timestamp":1618474839000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10462-020-09828-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,4,15]]},"references-count":103,"journal-issue":{"issue":"8","published-print":{"date-parts":[[2020,12]]}},"alternative-id":["9828"],"URL":"https:\/\/doi.org\/10.1007\/s10462-020-09828-3","relation":{},"ISSN":["0269-2821","1573-7462"],"issn-type":[{"value":"0269-2821","type":"print"},{"value":"1573-7462","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,4,15]]},"assertion":[{"value":"15 April 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}