{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,25]],"date-time":"2025-11-25T08:54:58Z","timestamp":1764060898300,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":34,"publisher":"ACM","license":[{"start":{"date-parts":[[2019,10,23]],"date-time":"2019-10-23T00:00:00Z","timestamp":1571788800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2019,10,23]]},"DOI":"10.1145\/3372938.3372998","type":"proceedings-article","created":{"date-parts":[[2020,1,8]],"date-time":"2020-01-08T03:54:01Z","timestamp":1578455641000},"page":"1-6","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":21,"title":["A comparison of features extraction methods for Arabic sentiment analysis"],"prefix":"10.1145","author":[{"given":"Mohammed","family":"Kasri","sequence":"first","affiliation":[{"name":"Department of Computer Sciences, University of Chouaib Doukkali, El Jadida Morocco"}]},{"given":"Marouane","family":"Birjali","sequence":"additional","affiliation":[{"name":"Department of Computer Sciences, University of Chouaib Doukkali, El Jadida Morocco"}]},{"given":"Abderrahim","family":"Beni-Hssane","sequence":"additional","affiliation":[{"name":"Department of Computer Sciences, University of Chouaib Doukkali, El Jadida Morocco"}]}],"member":"320","published-online":{"date-parts":[[2020,1,7]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N16-3003"},{"key":"#cr-split#-e_1_3_2_1_2_1.1","doi-asserted-by":"crossref","unstructured":"Shereen Albitar S\u00e9bastien Fournier and Bernard Espinasse. 2014. An Effective TF\/IDF-Based Text-to-Text Semantic Similarity Measure for Text Classification.. 105--114. DOI:https:\/\/doi.org\/10.1007\/978-3-319-11749-2_8 10.1007\/978-3-319-11749-2_8","DOI":"10.1007\/978-3-319-11749-2_8"},{"key":"#cr-split#-e_1_3_2_1_2_1.2","doi-asserted-by":"crossref","unstructured":"Shereen Albitar S\u00e9bastien Fournier and Bernard Espinasse. 2014. An Effective TF\/IDF-Based Text-to-Text Semantic Similarity Measure for Text Classification.. 105--114. DOI:https:\/\/doi.org\/10.1007\/978-3-319-11749-2_8","DOI":"10.1007\/978-3-319-11749-2_8"},{"key":"#cr-split#-e_1_3_2_1_3_1.1","doi-asserted-by":"crossref","unstructured":"Marouane Birjali Abderrahim Beni-Hssane and Mohammed Erritali. 2017. Machine Learning and Semantic Sentiment Analysis based Algorithms for Suicide Sentiment Prediction in Social Networks. Procedia Comput. Sci. 113 (2017) 65--72. DOI:https:\/\/doi.org\/10.1016\/j.procs.2017.08.290 10.1016\/j.procs.2017.08.290","DOI":"10.1016\/j.procs.2017.08.290"},{"key":"#cr-split#-e_1_3_2_1_3_1.2","doi-asserted-by":"crossref","unstructured":"Marouane Birjali Abderrahim Beni-Hssane and Mohammed Erritali. 2017. Machine Learning and Semantic Sentiment Analysis based Algorithms for Suicide Sentiment Prediction in Social Networks. Procedia Comput. Sci. 113 (2017) 65--72. DOI:https:\/\/doi.org\/10.1016\/j.procs.2017.08.290","DOI":"10.1016\/j.procs.2017.08.290"},{"key":"#cr-split#-e_1_3_2_1_4_1.1","doi-asserted-by":"crossref","unstructured":"Marouane Birjali Abderrahim Beni-Hssane and Mohammed Erritali. 2017. Analyzing Social Media through Big Data using InfoSphere BigInsights and Apache Flume. Procedia Comput. Sci. 113 (2017) 280--285. DOI:https:\/\/doi.org\/10.1016\/j.procs.2017.08.299 10.1016\/j.procs.2017.08.299","DOI":"10.1016\/j.procs.2017.08.299"},{"key":"#cr-split#-e_1_3_2_1_4_1.2","doi-asserted-by":"crossref","unstructured":"Marouane Birjali Abderrahim Beni-Hssane and Mohammed Erritali. 2017. Analyzing Social Media through Big Data using InfoSphere BigInsights and Apache Flume. Procedia Comput. Sci. 113 (2017) 280--285. DOI:https:\/\/doi.org\/10.1016\/j.procs.2017.08.299","DOI":"10.1016\/j.procs.2017.08.299"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2018.04.030"},{"key":"e_1_3_2_1_6_1","volume-title":"Jordan","author":"Blei David M.","year":"2003","unstructured":"David M. Blei , Andrew Y. Ng , and Michael I . Jordan . 2003 . Latent Dirichlet allocation. J. Mach. Learn. Res . (2003). DOI:https:\/\/doi.org\/10.1016\/b978-0-12-411519-4.00006-9 10.1016\/b978-0-12-411519-4.00006-9 David M. Blei, Andrew Y. Ng, and Michael I. Jordan. 2003. Latent Dirichlet allocation. J. Mach. Learn. Res. (2003). DOI:https:\/\/doi.org\/10.1016\/b978-0-12-411519-4.00006-9"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1016\/S1532-0464(03)00034-0"},{"key":"e_1_3_2_1_8_1","first-page":"210","article-title":"Social Network Sites: Definition, History, and Scholarship","volume":"13","author":"Ellison Nicole B.","year":"2007","unstructured":"Nicole B. Ellison and Danah M. Boyd . 2007 . Social Network Sites: Definition, History, and Scholarship . J. Comput. Commun. 13 , 1 (2007), 210 -- 230 . DOI:https:\/\/doi.org\/10.1111\/j.1083-6101.2007.00393.x 10.1111\/j.1083-6101.2007.00393.x Nicole B. Ellison and Danah M. Boyd. 2007. Social Network Sites: Definition, History, and Scholarship. J. Comput. Commun. 13, 1 (2007), 210--230. DOI:https:\/\/doi.org\/10.1111\/j.1083-6101.2007.00393.x","journal-title":"J. Comput. Commun."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/AICCSA.2016.7945800"},{"key":"e_1_3_2_1_10_1","series-title":"Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics). DOI:https:\/\/doi.org\/10.1007\/978-3-319-66854-3_20","volume-title":"Collecting and processing arabic facebook comments for sentiment analysis","author":"Elouardighi Abdeljalil","unstructured":"Abdeljalil Elouardighi , Mohcine Maghfour , and Hafdalla Hammia . 2017. Collecting and processing arabic facebook comments for sentiment analysis . In Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics). DOI:https:\/\/doi.org\/10.1007\/978-3-319-66854-3_20 10.1007\/978-3-319-66854-3_20 Abdeljalil Elouardighi, Mohcine Maghfour, and Hafdalla Hammia. 2017. Collecting and processing arabic facebook comments for sentiment analysis. In Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics). DOI:https:\/\/doi.org\/10.1007\/978-3-319-66854-3_20"},{"key":"e_1_3_2_1_11_1","first-page":"5","article-title":"An Approach of Semantic Similarity Measure between Documents Based on Big","volume":"6","author":"Erritali Mohammed","year":"2016","unstructured":"Mohammed Erritali , Abderrahim Beni-Hssane , Marouane Birjali , and Youness Madani . 2016 . An Approach of Semantic Similarity Measure between Documents Based on Big Data. Int. J. Electr. Comput. Eng. 6 , 5 (October 2016), 2454. DOI:https:\/\/doi.org\/10.11591\/ijece.v6i5.10853 10.11591\/ijece.v6i5.10853 Mohammed Erritali, Abderrahim Beni-Hssane, Marouane Birjali, and Youness Madani. 2016. An Approach of Semantic Similarity Measure between Documents Based on Big Data. Int. J. Electr. Comput. Eng. 6, 5 (October 2016), 2454. DOI:https:\/\/doi.org\/10.11591\/ijece.v6i5.10853","journal-title":"Data. Int. J. Electr. Comput. Eng."},{"key":"e_1_3_2_1_12_1","volume-title":"The Digital Universe","author":"Gantz John","year":"2020","unstructured":"John Gantz , David Reinsel , and Bigger Digital Shadows . 2012. The Digital Universe in 2020 . IDC iView \"Big Data, Bigger Digit. Shad. Biggest Growth Far East \" (2012). John Gantz, David Reinsel, and Bigger Digital Shadows. 2012. The Digital Universe in 2020. IDC iView \"Big Data, Bigger Digit. Shad. Biggest Growth Far East\" (2012)."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-006-6226-1"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1080\/00437956.1954.11659520"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/SAI.2014.6918213"},{"key":"e_1_3_2_1_16_1","volume-title":"31st International Conference on Machine Learning, ICML","author":"Le Quoc","year":"2014","unstructured":"Quoc Le and Tomas Mikolov . 2014 . Distributed representations of sentences and documents . In 31st International Conference on Machine Learning, ICML 2014. Quoc Le and Tomas Mikolov. 2014. Distributed representations of sentences and documents. In 31st International Conference on Machine Learning, ICML 2014."},{"key":"#cr-split#-e_1_3_2_1_17_1.1","doi-asserted-by":"crossref","unstructured":"Bing Liu. 2012. Sentiment analysis and opinion mining. Synth. Lect. Hum. Lang. Technol. (2012). DOI:https:\/\/doi.org\/10.2200\/S00416ED1V01Y201204HLT016 10.2200\/S00416ED1V01Y201204HLT016","DOI":"10.2200\/S00416ED1V01Y201204HLT016"},{"key":"#cr-split#-e_1_3_2_1_17_1.2","doi-asserted-by":"crossref","unstructured":"Bing Liu. 2012. Sentiment analysis and opinion mining. Synth. Lect. Hum. Lang. Technol. (2012). DOI:https:\/\/doi.org\/10.2200\/S00416ED1V01Y201204HLT016","DOI":"10.2200\/S00416ED1V01Y201204HLT016"},{"key":"e_1_3_2_1_18_1","unstructured":"Avinash Madasu and Sivasankar E. 2019. A Study of Feature Extraction techniques for Sentiment Analysis. (June 2019). Retrieved from http:\/\/arxiv.org\/abs\/1906.01573  Avinash Madasu and Sivasankar E. 2019. A Study of Feature Extraction techniques for Sentiment Analysis. (June 2019). Retrieved from http:\/\/arxiv.org\/abs\/1906.01573"},{"key":"e_1_3_2_1_19_1","volume-title":"Efficient Estimation of Word Representations in Vector Space. (January","author":"Mikolov Tomas","year":"2013","unstructured":"Tomas Mikolov , Kai Chen , Greg Corrado , and Jeffrey Dean . 2013. Efficient Estimation of Word Representations in Vector Space. (January 2013 ). Retrieved from http:\/\/arxiv.org\/abs\/1301.3781 Tomas Mikolov, Kai Chen, Greg Corrado, and Jeffrey Dean. 2013. Efficient Estimation of Word Representations in Vector Space. (January 2013). Retrieved from http:\/\/arxiv.org\/abs\/1301.3781"},{"key":"e_1_3_2_1_20_1","unstructured":"Tomas Mikolov Ilya Sutskever Kai Chen Greg Corrado and Jeffrey Dean. 2013. Distributed representations of words and phrases and their compositionality. In Advances in Neural Information Processing Systems.  Tomas Mikolov Ilya Sutskever Kai Chen Greg Corrado and Jeffrey Dean. 2013. Distributed representations of words and phrases and their compositionality. In Advances in Neural Information Processing Systems."},{"key":"e_1_3_2_1_21_1","volume-title":"LABR: A Large Scale Arabic Sentiment Analysis Benchmark. arXiv.org (November","author":"Nabil Mahmoud","year":"2014","unstructured":"Mahmoud Nabil , Mohamed Aly , and Amir Atiya . 2014 . LABR: A Large Scale Arabic Sentiment Analysis Benchmark. arXiv.org (November 2014). Retrieved from https:\/\/arxiv.org\/abs\/1411.6718v2 Mahmoud Nabil, Mohamed Aly, and Amir Atiya. 2014. LABR: A Large Scale Arabic Sentiment Analysis Benchmark. arXiv.org (November 2014). Retrieved from https:\/\/arxiv.org\/abs\/1411.6718v2"},{"key":"e_1_3_2_1_22_1","volume-title":"ADCS 2009 - Proc. Fourteenth Australas. Doc. Comput. Symp.","author":"O'Keefe Tim","year":"2009","unstructured":"Tim O'Keefe and Irena Koprinska . 2009 . Feature selection and weighting methods in sentiment analysis . ADCS 2009 - Proc. Fourteenth Australas. Doc. Comput. Symp. (2009). Tim O'Keefe and Irena Koprinska. 2009. Feature selection and weighting methods in sentiment analysis. ADCS 2009 - Proc. Fourteenth Australas. Doc. Comput. Symp. (2009)."},{"key":"e_1_3_2_1_23_1","volume-title":"El-Beltagy","author":"Soliman Abu Bakr","year":"2017","unstructured":"Abu Bakr Soliman , Kareem Eissa , and Samhaa R . El-Beltagy . 2017 . AraVec: A set of Arabic Word Embedding Models for use in Arabic NLP. Procedia Comput. Sci . 117, (2017), 256--265. DOI:https:\/\/doi.org\/10.1016\/j.procs.2017.10.117 10.1016\/j.procs.2017.10.117 Abu Bakr Soliman, Kareem Eissa, and Samhaa R. El-Beltagy. 2017. AraVec: A set of Arabic Word Embedding Models for use in Arabic NLP. Procedia Comput. Sci. 117, (2017), 256--265. DOI:https:\/\/doi.org\/10.1016\/j.procs.2017.10.117"},{"key":"e_1_3_2_1_24_1","first-page":"1","article-title":"A STATISTICAL INTERPRETATION OF TERM SPECIFICITY AND ITS APPLICATION IN RETRIEVAL","volume":"28","author":"KAREN SPARCK","year":"1972","unstructured":"KAREN SPARCK JONES. 1972 . A STATISTICAL INTERPRETATION OF TERM SPECIFICITY AND ITS APPLICATION IN RETRIEVAL . J. Doc. 28 , 1 (January 1972), 11--21. DOI:https:\/\/doi.org\/10.1108\/eb026526 10.1108\/eb026526 KAREN SPARCK JONES. 1972. A STATISTICAL INTERPRETATION OF TERM SPECIFICITY AND ITS APPLICATION IN RETRIEVAL. J. Doc. 28, 1 (January 1972), 11--21. DOI:https:\/\/doi.org\/10.1108\/eb026526","journal-title":"J. Doc."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/DSC.2016.110"},{"key":"#cr-split#-e_1_3_2_1_26_1.1","doi-asserted-by":"crossref","unstructured":"Jihong Yan Muammer Ko\u00e7 and Jay Lee. 2004. A prognostic algorithm for machine performance assessment and its application. In Production Planning and Control. DOI:https:\/\/doi.org\/10.1080\/09537280412331309208 10.1080\/09537280412331309208","DOI":"10.1080\/09537280412331309208"},{"key":"#cr-split#-e_1_3_2_1_26_1.2","doi-asserted-by":"crossref","unstructured":"Jihong Yan Muammer Ko\u00e7 and Jay Lee. 2004. A prognostic algorithm for machine performance assessment and its application. In Production Planning and Control. DOI:https:\/\/doi.org\/10.1080\/09537280412331309208","DOI":"10.1080\/09537280412331309208"},{"key":"#cr-split#-e_1_3_2_1_27_1.1","doi-asserted-by":"crossref","unstructured":"Cha Zhang and Yunqian Ma (Eds.). 2012. Ensemble Machine Learning. Springer US Boston MA. DOI:https:\/\/doi.org\/10.1007\/978-1-4419-9326-7 10.1007\/978-1-4419-9326-7","DOI":"10.1007\/978-1-4419-9326-7"},{"key":"#cr-split#-e_1_3_2_1_27_1.2","doi-asserted-by":"crossref","unstructured":"Cha Zhang and Yunqian Ma (Eds.). 2012. Ensemble Machine Learning. Springer US Boston MA. DOI:https:\/\/doi.org\/10.1007\/978-1-4419-9326-7","DOI":"10.1007\/978-1-4419-9326-7"},{"key":"e_1_3_2_1_28_1","first-page":"3","article-title":"A comparative study of TF-IDF, LSI and multi-words for text classification","volume":"38","author":"Zhang Wen","year":"2011","unstructured":"Wen Zhang , Taketoshi Yoshida , and Xijin Tang . 2011 . A comparative study of TF-IDF, LSI and multi-words for text classification . Expert Syst. Appl. 38 , 3 (March 2011), 2758--2765. DOI:https:\/\/doi.org\/10.1016\/j.eswa.2010.08.066 10.1016\/j.eswa.2010.08.066 Wen Zhang, Taketoshi Yoshida, and Xijin Tang. 2011. A comparative study of TF-IDF, LSI and multi-words for text classification. Expert Syst. Appl. 38, 3 (March 2011), 2758--2765. DOI:https:\/\/doi.org\/10.1016\/j.eswa.2010.08.066","journal-title":"Expert Syst. Appl."}],"event":{"name":"BDIoT'19: The 4th International Conference On Big Data and Internet of Things","acronym":"BDIoT'19","location":"Rabat Morocco"},"container-title":["Proceedings of the 4th International Conference on Big Data and Internet of Things"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3372938.3372998","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3372938.3372998","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T17:49:58Z","timestamp":1750268998000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3372938.3372998"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,10,23]]},"references-count":34,"alternative-id":["10.1145\/3372938.3372998","10.1145\/3372938"],"URL":"https:\/\/doi.org\/10.1145\/3372938.3372998","relation":{},"subject":[],"published":{"date-parts":[[2019,10,23]]},"assertion":[{"value":"2020-01-07","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}