{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,9]],"date-time":"2024-10-09T04:36:23Z","timestamp":1728448583156},"reference-count":26,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2023,11,1]],"date-time":"2023-11-01T00:00:00Z","timestamp":1698796800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,11,1]],"date-time":"2023-11-01T00:00:00Z","timestamp":1698796800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Data Sci Anal"],"published-print":{"date-parts":[[2024,10]]},"DOI":"10.1007\/s41060-023-00460-2","type":"journal-article","created":{"date-parts":[[2023,11,1]],"date-time":"2023-11-01T19:02:23Z","timestamp":1698865343000},"page":"393-403","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["FLICs (Facebook Language Informal Corpus): a novel dataset for informal language"],"prefix":"10.1007","volume":"18","author":[{"given":"Francis","family":"Rakotomalala","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Aim\u00e9 Richard","family":"Hajalalaina","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Manda Vy","family":"Ravonimanantsoa Ndaohialy","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Anselme","family":"Andriavelonera Alexandre","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andriatina H.","family":"Ranaivoson","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,11,1]]},"reference":[{"key":"460_CR1","doi-asserted-by":"crossref","unstructured":"Baaqeel H., Zagrouba, R., et al.: Hybrid SMS spam filtering system using machine learning techniques. In: 2020 21st International Arab Conference on Information Technology (ACIT), pp. 1\u20138. (2020)","DOI":"10.1109\/ACIT50332.2020.9300071"},{"issue":"1","key":"460_CR2","first-page":"1","volume":"1","author":"H Sajedi","year":"2016","unstructured":"Sajedi, H., Parast, G.Z., Akbari, F.: Sms spam filtering using machine learning techniques: A survey. Mach. Learn. Res. 1(1), 1\u201314 (2016)","journal-title":"Mach. Learn. Res."},{"key":"460_CR3","unstructured":"Twitter Sentiment Classification using Distant Supervision - Google Scholar. https:\/\/scholar.google.com\/scholar?hl=fr&as_sdt=0%2C5&q=Twitter+Sentiment+Classification+using+Distant+Supervision&btnG= (consult\u00e9 le 4 mars 2023)."},{"key":"460_CR4","unstructured":"Pak A., Paroubek, P.: Twitter as a corpus for sentiment analysis and opinion mining. In: LREc, vol. 10, pp. 1320\u20131326 (2010)."},{"key":"460_CR5","doi-asserted-by":"crossref","unstructured":"Danescu-Niculescu-Mizil, C., West, R., Jurafsky, D., Leskovec, J., Potts, C.: No country for old members: User lifecycle and linguistic change in online communities. In: Proceedings of the 22nd International Conference on World Wide Web, pp. 307\u2013318 (2013).","DOI":"10.1145\/2488388.2488416"},{"key":"460_CR6","doi-asserted-by":"crossref","unstructured":"Li, J., Galley, M., Brockett, C., Spithourakis, G.P., Gao, J., Dolan, B.: A persona-based neural conversation model. ArXiv Prepr. ArXiv160306155, (2016).","DOI":"10.18653\/v1\/P16-1094"},{"key":"460_CR7","doi-asserted-by":"crossref","unstructured":"Zhang, S., Dinan, E., Urbanek, J., Szlam, A., Kiela, D., Weston, J.: Personalizing dialogue agents: I have a dog, do you have pets too? ArXiv Prepr. ArXiv180107243 (2018).","DOI":"10.18653\/v1\/P18-1205"},{"key":"460_CR8","doi-asserted-by":"crossref","unstructured":"Liu Q., et al.: You impress me: Dialogue generation via mutual persona perception, ArXiv Prepr. ArXiv200405388 (2020).","DOI":"10.18653\/v1\/2020.acl-main.131"},{"key":"460_CR9","doi-asserted-by":"crossref","unstructured":"Baumgartner, J., Zannettou, S., Keegan, B., Squire, M., Blackburn, J.: The pushshift reddit dataset. In: Proceedings of the International AAAI Conference on Web and Social Media, vol. 14, pp. 830\u2013839 (2020).","DOI":"10.1609\/icwsm.v14i1.7347"},{"key":"460_CR10","doi-asserted-by":"crossref","unstructured":"Setty, V., Rekve, E.: Truth be told: Fake news detection using user reactions on reddit. In: Proceedings of the 29th ACM International Conference on Information & Knowledge Management, pp. 3325\u20133328 (2020)","DOI":"10.1145\/3340531.3417463"},{"key":"460_CR11","unstructured":"Lample, G., Conneau, A., Denoyer, L., Ranzato, M.: Unsupervised machine translation using monolingual corpora only. ArXiv Prepr. ArXiv171100043 (2017)"},{"key":"460_CR12","doi-asserted-by":"crossref","unstructured":"Barbieri, F., Camacho-Collados, J., Neves, L., Espinosa-Anke, L.: Tweeteval: Unified benchmark and comparative evaluation for tweet classification. ArXiv Prepr. ArXiv201012421 (2020)","DOI":"10.18653\/v1\/2020.findings-emnlp.148"},{"key":"460_CR13","doi-asserted-by":"crossref","unstructured":"Solorio, T., et al.: Overview for the first shared task on language identification in code-switched data. In: Proceedings of the First Workshop on Computational Approaches to Code Switching, pp. 62\u201372 (2014).","DOI":"10.3115\/v1\/W14-3907"},{"key":"460_CR14","unstructured":"Ross, B., Rist, M., Carbonell, G., Cabrera, B., Kurowsky, N., Wojatzki, M.: Measuring the reliability of hate speech annotations: The case of the European refugee crisis. ArXiv Prepr. ArXiv170108118 (2017)"},{"key":"460_CR15","doi-asserted-by":"crossref","unstructured":"Klinger, R., De Clercq, O., Mohammad, S. M., Balahur, A.: IEST: WASSA-2018 implicit emotions shared task. ArXiv Prepr. ArXiv180901083 (2018).","DOI":"10.18653\/v1\/W18-6206"},{"key":"460_CR16","unstructured":"Rakotoson, H. et al.: Creation of a reference corpus for the Malagasy language. In: Proceedings of the 10th Language Resources and Evaluation Conference (LREC 2016), Portoro\u017e, Slovenia, pp. 1733\u20131740 (2016)"},{"key":"460_CR17","unstructured":"Ralison, A. et al.: Annotation and analysis of the Corpus of Malagasy Informal Texts (COTMI). In: Proceedings of the Workshop on Language Technologies for African Languages (AfLaT 2017), Valencia, Spain, pp. 39\u201344. (2017)"},{"key":"460_CR18","unstructured":"Razafindramanana, L. et al.: Building and analyzing a corpus of Malagasy texts from the web. In: Proceedings of the 7th Workshop on Balto-Slavic Natural Language Processing (BSNLP 2019), Florence, Italy, pp. 62\u201370 (2019)."},{"key":"460_CR19","unstructured":"Rakotoarisoa, J.-B., et al.: Building and analyzing a corpus of Malagasy journalistic texts. In: Proceedings of 4th Workshop Computational Linguistics Ural. Languages CoLU 2019 Turku Finl. pp 102\u2013108 (2019)"},{"key":"460_CR20","unstructured":"Mikolov, T., Sutskever, I., Chen, K., Corrado, G.S., Dean, J.: Distributed representations of words and phrases and their compositionality. Adv. Neural Inf. Process. Syst. 26 (2013)"},{"key":"460_CR21","unstructured":"Mikolov, T., Le, Q.V., Sutskever, I.: Exploiting similarities among languages for machine translation. ArXiv Prepr. ArXiv13094168 (2013)"},{"key":"460_CR22","unstructured":"Kim, K., et al.: A deep learning approach for sentiment analysis in informal language (2019)."},{"key":"460_CR23","unstructured":"Marcoux, R., Richard, L., Wolff, A.: Estimation des populations francophones dans le monde en. Sources D\u00e9marches M\u00e9thodologiques (2022)"},{"key":"460_CR24","unstructured":"Wolf, A.: La langue fran\u00e7aise dans le monde. Organisation internationale de la Francophonie (2014)."},{"key":"460_CR25","doi-asserted-by":"crossref","unstructured":"Ling, W., Dyer, C., Black, A.W., Trancoso, I.: Two\/too simple adaptations of word2vec for syntax problems. In: Proceedings of the 2015 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 1299\u20131304 (2015)","DOI":"10.3115\/v1\/N15-1142"},{"key":"460_CR26","doi-asserted-by":"crossref","unstructured":"Bustamam, A., Tasman, H., Yuniarti, N., Frisca, F., Mursidah, I.: Application of k-means clustering algorithm in grouping the DNA sequences of hepatitis B virus (HBV). In: AIP Conference Proceedings, AIP Publishing (2017)","DOI":"10.1063\/1.4991238"}],"container-title":["International Journal of Data Science and Analytics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-023-00460-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s41060-023-00460-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-023-00460-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,9]],"date-time":"2024-10-09T02:12:40Z","timestamp":1728439960000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s41060-023-00460-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,11,1]]},"references-count":26,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2024,10]]}},"alternative-id":["460"],"URL":"https:\/\/doi.org\/10.1007\/s41060-023-00460-2","relation":{},"ISSN":["2364-415X","2364-4168"],"issn-type":[{"type":"print","value":"2364-415X"},{"type":"electronic","value":"2364-4168"}],"subject":[],"published":{"date-parts":[[2023,11,1]]},"assertion":[{"value":"1 April 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 September 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 November 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declaration"}},{"value":"The authors have no conflicts of interest to declare that are relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}