{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,10]],"date-time":"2025-12-10T16:01:20Z","timestamp":1765382480681,"version":"3.37.3"},"reference-count":36,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2023,9,15]],"date-time":"2023-09-15T00:00:00Z","timestamp":1694736000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,9,15]],"date-time":"2023-09-15T00:00:00Z","timestamp":1694736000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-023-16491-7","type":"journal-article","created":{"date-parts":[[2023,9,15]],"date-time":"2023-09-15T01:01:57Z","timestamp":1694739717000},"page":"31279-31295","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Incorporating Word Embedding and Hybrid Model Random Forest Softmax Regression for Predicting News Categories"],"prefix":"10.1007","volume":"83","author":[{"given":"Saima","family":"Khosa","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Furqan","family":"Rustam","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Arif","family":"Mehmood","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Gyu Sang","family":"Choi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8271-6496","authenticated-orcid":false,"given":"Imran","family":"Ashraf","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,9,15]]},"reference":[{"key":"16491_CR1","unstructured":"BBC (2022) Bbc news dataset available online. [Online]. Available: http:\/\/mlg.ucd.ie\/datasets\/bbc.html"},{"key":"16491_CR2","doi-asserted-by":"crossref","unstructured":"B\u00edr\u00f3 I, Sikl\u00f3si D, Szab\u00f3 J, Bencz\u00far AA (2009) Linked latent dirichlet allocation in web spam filtering. In: Proceedings of the 5th International Workshop on Adversarial Information Retrieval on the Web, p 37\u201340","DOI":"10.1145\/1531914.1531922"},{"key":"16491_CR3","doi-asserted-by":"crossref","unstructured":"Bounabi M, El\u00a0Moutaouakil K, Satori K (2017) A comparison of text classification methods method of weighted terms selected by different stemming techniques. In: Proceedings of the 2nd international Conference on Big Data, Cloud and Applications, p 1\u20139","DOI":"10.1145\/3090354.3090398"},{"key":"16491_CR4","unstructured":"Breiman L, Freidman J, Olshen R, Stone C (1984) Classification and regression trees. wadsworth, monterey, ca. Classification and regression trees. Wadsworth, Monterey, CA"},{"key":"16491_CR5","doi-asserted-by":"crossref","unstructured":"Dadgar SMH, Araghi MS, Farahani MM (2016) A novel text mining approach based on tf-idf and support vector machine for news classification. In: 2016 IEEE International Conference on Engineering and Technology (ICETECH). IEEE, pp. 112\u2013116","DOI":"10.1109\/ICETECH.2016.7569223"},{"key":"16491_CR6","doi-asserted-by":"crossref","unstructured":"Dandeniya D (2018) An automatic e-news article content extraction and classification. In: 2018 18th International Conference on Advances in ICT for Emerging Regions (ICTer). IEEE, 2018, pp. 196\u2013202","DOI":"10.1109\/ICTER.2018.8615480"},{"key":"16491_CR7","unstructured":"Elghannam F (2019) Text representation and classification based on bi-gram alphabet. Journal of King Saud University-Computer and Information Sciences"},{"key":"16491_CR8","unstructured":"Glorot X, Bordes A, Bengio Y (2011) Domain adaptation for large-scale sentiment classification: A deep learning approach"},{"key":"16491_CR9","doi-asserted-by":"crossref","unstructured":"Gupta RK, Yang Y (2019) Predicting and understanding news social popularity with emotional salience features. In: Proceedings of the 27th ACM International Conference on Multimedia, pp. 139\u2013147","DOI":"10.1145\/3343031.3351048"},{"key":"16491_CR10","doi-asserted-by":"crossref","unstructured":"Haryanto AW, Mawardi EK et\u00a0al. (2018) Influence of word normalization and chi-squared feature selection on support vector machine (svm) text classification. In: 2018 International Seminar on Application for Technology of Information and Communication. IEEE, pp. 229\u2013233","DOI":"10.1109\/ISEMANTIC.2018.8549748"},{"key":"16491_CR11","doi-asserted-by":"publisher","unstructured":"Kadhim AI, Cheah YN, Ahamed NH (2014) Text document preprocessing and dimension reduction techniques for text document clustering. In: 2014 4th International Conference on Artificial Intelligence with Applications in Engineering and Technology. IEEE, p 69\u201373. https:\/\/doi.org\/10.1109\/ICAIET.2014.2","DOI":"10.1109\/ICAIET.2014.2"},{"key":"16491_CR12","doi-asserted-by":"crossref","unstructured":"Karaman Y, Akdeniz F, Sava\u015f BK, Becerikli Y (2023) A comparative analysis of svm, lstm and cnn-rnn models for the bbc news classification. In: Innovations in Smart Cities Applications Volume 6: The Proceedings of the 7th International Conference on Smart City Applications. Springer, p 473\u2013483","DOI":"10.1007\/978-3-031-26852-6_44"},{"issue":"8","key":"16491_CR13","doi-asserted-by":"publisher","first-page":"2788","DOI":"10.3390\/app10082788","volume":"10","author":"M Khalid","year":"2020","unstructured":"Khalid M, Ashraf I, Mehmood A, Ullah S, Ahmad M, Choi GS (2020) Gbsvm: Sentiment classification from unstructured reviews using ensemble classifier. Applied Sciences 10(8):2788","journal-title":"Applied Sciences"},{"key":"16491_CR14","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1016\/j.ins.2018.10.006","volume":"477","author":"D Kim","year":"2019","unstructured":"Kim D, Seo D, Cho S, Kang P (2019) Multi-co-training for document classification using various document representations: Tf-idf, lda, and doc2vec. Information Sciences 477:15\u201329","journal-title":"Information Sciences"},{"key":"16491_CR15","doi-asserted-by":"crossref","unstructured":"Kjaerulff UB, Madsen AL (2008) Bayesian networks and influence diagrams. Springer Science+ Business Media, vol. 200, p. 114, 2008","DOI":"10.1007\/978-0-387-74101-7"},{"key":"16491_CR16","doi-asserted-by":"publisher","first-page":"10333","DOI":"10.1109\/ACCESS.2022.3144659","volume":"10","author":"E Lee","year":"2022","unstructured":"Lee E, Rustam F, Ashraf I, Washington PB, Narra M, Shafique R (2022) Inquest of current situation in afghanistan under taliban rule using sentiment analysis and volume analysis. IEEE Access 10:10333\u201310348","journal-title":"IEEE Access"},{"issue":"3","key":"16491_CR17","first-page":"18","volume":"2","author":"A Liaw","year":"2002","unstructured":"Liaw A, Wiener M et al (2002) Classification and regression by randomforest. R news 2(3):18\u201322","journal-title":"R news"},{"key":"16491_CR18","unstructured":"McCallum A, Nigam K, et\u00a0al. (1998) A comparison of event models for naive bayes text classification. In: AAAI-98 workshop on learning for text categorization, vol. 752, no.\u00a01. Citeseer, pp. 41\u201348"},{"key":"16491_CR19","doi-asserted-by":"crossref","unstructured":"Mehmood A, On BW, Lee I, Ashraf I, Choi GS (2017) Spam comments prediction using stacking with ensemble learning. In: Journal of Physics: Conference Series, vol. 933, no.\u00a01. IOP Publishing, p. 012012","DOI":"10.1088\/1742-6596\/933\/1\/012012"},{"key":"16491_CR20","doi-asserted-by":"crossref","unstructured":"M\u00e9ndez JR, Iglesias EL, Fdez-Riverola F, D\u00edaz F, Corchado JM (2005) Tokenising, stemming and stopword removal on anti-spam filtering domain. In: Conference of the Spanish Association for Artificial Intelligence. Springer, p 449\u2013458","DOI":"10.1007\/11881216_47"},{"key":"16491_CR21","doi-asserted-by":"crossref","unstructured":"Neelakantan A, Shankar J, Passos A, McCallum A (2015) Efficient non-parametric estimation of multiple embeddings per word in vector space. arXiv:1504.06654","DOI":"10.3115\/v1\/D14-1113"},{"issue":"3","key":"16491_CR22","doi-asserted-by":"publisher","DOI":"10.24425\/bpasts.2021.136749","volume":"69","author":"AM Osowska-Kurczab","year":"2021","unstructured":"Osowska-Kurczab AM, Markiewicz T, Dziekiewicz M, Lorent M (2021) Multi-feature ensemble system in the renal tumour classification task. Bulletin of the Polish Academy of Sciences: Technical Sciences 69(3):e136749","journal-title":"Bulletin of the Polish Academy of Sciences: Technical Sciences"},{"issue":"1","key":"16491_CR23","doi-asserted-by":"publisher","first-page":"217","DOI":"10.1080\/01431160412331269698","volume":"26","author":"M Pal","year":"2005","unstructured":"Pal M (2005) Random forest classifier for remote sensing classification. International Journal of Remote Sensing 26(1):217\u2013222","journal-title":"International Journal of Remote Sensing"},{"key":"16491_CR24","unstructured":"Quinlan JR, C4. 5: programs for machine learning. Elsevier, 2014"},{"key":"16491_CR25","doi-asserted-by":"crossref","unstructured":"Rana MI, Khalid S, Akbar MU (2014) News classification based on their headlines: A review. In: 17th IEEE International Multi Topic Conference 2014. IEEE, p 211\u2013216","DOI":"10.1109\/INMIC.2014.7097339"},{"key":"16491_CR26","doi-asserted-by":"crossref","unstructured":"Reshi AA, Rustam F, Aljedaani W, Shafi S, Alhossan A, Alrabiah Z, Ahmad A, Alsuwailem H, Almangour TA, Alshammari MA et\u00a0al. (2022) Covid-19 vaccination-related sentiments analysis: a case study using worldwide twitter dataset. In: Healthcare, vol.\u00a010, no.\u00a03. MDPI, p. 411","DOI":"10.3390\/healthcare10030411"},{"issue":"11","key":"16491_CR27","doi-asserted-by":"publisher","first-page":"1078","DOI":"10.3390\/e21111078","volume":"21","author":"F Rustam","year":"2019","unstructured":"Rustam F, Ashraf I, Mehmood A, Ullah S, Choi GS (2019) Tweets classification on the base of sentiments for us airline companies. Entropy 21(11):1078","journal-title":"Entropy"},{"key":"16491_CR28","doi-asserted-by":"crossref","unstructured":"Rustam F, Mehmood A, Ahmad M, Ullah S, Khan DM, Choi GS (2020) Classification of shopify app user reviews using novel multi text features. EEE Access","DOI":"10.1109\/ACCESS.2020.2972632"},{"key":"16491_CR29","doi-asserted-by":"publisher","unstructured":"Sadeghi D, Shoeibi A, Ghassemi N, Moridian P, Khadem A, Alizadehsani R, Teshnehlab M, Gorriz JM, Khozeimeh F, Zhang YD, Nahavandi S, Acharya UR (2022) An overview of artificial intelligence techniques for diagnosis of schizophrenia based on magnetic resonance imaging modalities: Methods, challenges, and future works. Computers in Biology and Medicine, vol. 146, p. 105554, [Online]. Available: https:\/\/doi.org\/10.1016\/j.compbiomed.2022.105554","DOI":"10.1016\/j.compbiomed.2022.105554"},{"key":"16491_CR30","unstructured":"Salman HA, Obaida TH (2021) Bbc news data classification using na\u00efve bayes based on bag of word. Journal of Hunan University (NaturalSciences), vol.\u00a048, no.\u00a09"},{"key":"16491_CR31","unstructured":"Shoeibi A, Khodatars M, Alizadehsani R, Ghassemi N, Jafari M, Moridian P, Khadem A, Sadeghi D, Hussain S, Zare A, Sani ZA, Bazeli J, Khozeimeh F, Khosravi A, Nahavandi S, Acharya UR, Gorriz JM (2022) Automated detection and forecasting of covid-19 using deep learning techniques: A review"},{"key":"16491_CR32","doi-asserted-by":"publisher","unstructured":"Shoeibi A, Khodatars M, Jafari M, Moridian P, Rezaei M, Alizadehsani R, Khozeimeh F, Gorriz JM, Heras J, Panahiazar M, Nahavandi S, Acharya UR (2021) Applications of deep learning techniques for automated multiple sclerosis detection using magnetic resonance imaging: A review. Computers in Biology and Medicine, vol. 136, p. 104697, [Online]. Available: https:\/\/doi.org\/10.1016\/j.compbiomed.2021.104697","DOI":"10.1016\/j.compbiomed.2021.104697"},{"key":"16491_CR33","doi-asserted-by":"crossref","unstructured":"Tariq S, Akhtar N, Afzal H, Khalid S, Mufti MR, Hussain S, Habib A, Ahmad G (2019) A novel co-training-based approach for the classification of mental illnesses using social media posts. IEEE Access, vol.\u00a07, p 166,165\u2013166,172","DOI":"10.1109\/ACCESS.2019.2953087"},{"key":"16491_CR34","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1016\/j.procs.2017.10.039","volume":"116","author":"R Wongso","year":"2017","unstructured":"Wongso R, Luwinda FA, Trisnajaya BC, Rusli O et al (2017) News article text classification in indonesian language. Procedia Comput Sci 116:137\u2013143","journal-title":"Procedia Comput Sci"},{"issue":"1\u20134","key":"16491_CR35","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1007\/s13042-010-0001-0","volume":"1","author":"Y Zhang","year":"2010","unstructured":"Zhang Y, Jin R, Zhou Z-H (2010) Understanding bag-of-words model: a statistical framework. International Journal of Machine Learning and Cybernetics 1(1\u20134):43\u201352","journal-title":"International Journal of Machine Learning and Cybernetics"},{"key":"16491_CR36","doi-asserted-by":"crossref","unstructured":"Zhu W, Zhang W, Li G-Z, He C, Zhang L (2016) A study of damp-heat syndrome classification using word2vec and tf-idf. In 2016 IEEE International Conference on Bioinformatics and Biomedicine (BIBM). IEEE, pp. 1415\u20131420","DOI":"10.1109\/BIBM.2016.7822730"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-16491-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-023-16491-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-16491-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,8]],"date-time":"2024-03-08T06:35:17Z","timestamp":1709879717000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-023-16491-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,9,15]]},"references-count":36,"journal-issue":{"issue":"11","published-online":{"date-parts":[[2024,3]]}},"alternative-id":["16491"],"URL":"https:\/\/doi.org\/10.1007\/s11042-023-16491-7","relation":{},"ISSN":["1573-7721"],"issn-type":[{"type":"electronic","value":"1573-7721"}],"subject":[],"published":{"date-parts":[[2023,9,15]]},"assertion":[{"value":"17 November 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 May 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 August 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 September 2023","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflicts of interest"}}]}}