{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,10]],"date-time":"2025-12-10T12:48:02Z","timestamp":1765370882281,"version":"3.46.0"},"reference-count":23,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2025,9,26]],"date-time":"2025-09-26T00:00:00Z","timestamp":1758844800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,26]],"date-time":"2025-09-26T00:00:00Z","timestamp":1758844800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Iran J Comput Sci"],"published-print":{"date-parts":[[2025,12]]},"DOI":"10.1007\/s42044-025-00332-x","type":"journal-article","created":{"date-parts":[[2025,9,26]],"date-time":"2025-09-26T11:27:35Z","timestamp":1758886055000},"page":"2949-2963","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Multi-label imbalanced text handling using ensemble methodology with application to biomedical data classification"],"prefix":"10.1007","volume":"8","author":[{"given":"Subhajit","family":"Ghosh","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sanidhya","family":"Gupta","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sourav","family":"Bhattacharyya","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Avik Kumar","family":"Das","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Apurba","family":"Nandi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ardhendu","family":"Sarkar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Partha Sarathi","family":"Samanta","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chantri","family":"Polprasert","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,9,26]]},"reference":[{"key":"332_CR1","unstructured":"Gao, X., Xie, D., Zhang, Y., Wang, Z., He, C., Yin, H., Zhang, W.: A comprehensive survey on imbalanced data learning. arXiv preprint arXiv:2502.08960 (2025)"},{"key":"332_CR2","doi-asserted-by":"publisher","first-page":"105151","DOI":"10.1016\/j.engappai.2022.105151","volume":"115","author":"MA Ganaie","year":"2022","unstructured":"Ganaie, M.A., Hu, M., Malik, A.K., Tanveer, M., Suganthan, P.N.: Ensemble deep learning: a review. Eng. Appl. Artif. Intell. 115, 105151 (2022)","journal-title":"Eng. Appl. Artif. Intell."},{"issue":"1","key":"332_CR3","doi-asserted-by":"publisher","first-page":"61","DOI":"10.1186\/s40537-025-01108-7","volume":"12","author":"K Taha","year":"2025","unstructured":"Taha, K.: Machine learning in biomedical and health big data: a comprehensive survey with empirical and experimental insights. J. Big Data 12(1), 61 (2025)","journal-title":"J. Big Data"},{"issue":"10","key":"332_CR4","doi-asserted-by":"publisher","first-page":"1338","DOI":"10.1109\/TKDE.2006.162","volume":"18","author":"M-L Zhang","year":"2006","unstructured":"Zhang, M.-L., Zhou, Z.-H.: Multilabel neural networks with applications to functional genomics and text categorization. IEEE Trans. Knowl. Data Eng. 18(10), 1338\u20131351 (2006)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"332_CR5","doi-asserted-by":"crossref","unstructured":"Nam, J., Kim, J., Loza\u00a0Menc\u00eda, E., Gurevych, I., F\u00fcrnkranz, J.: Large-scale multi-label text classification\u2014revisiting neural networks. In: Machine Learning and Knowledge Discovery in Databases: European Conference, ECML PKDD 2014, Nancy, France, September 15\u201319, 2014. Proceedings, Part II 14, pp. 437\u2013452. Springer, Berlin (2014)","DOI":"10.1007\/978-3-662-44851-9_28"},{"key":"332_CR6","doi-asserted-by":"publisher","unstructured":"Zhang, N., Lei, D., Zhao, J.F.: An improved Adagrad gradient descent optimization algorithm. In: 2018 Chinese Automation Congress (CAC), pp. 2359\u20132362 (2018). https:\/\/doi.org\/10.1109\/CAC.2018.8623271","DOI":"10.1109\/CAC.2018.8623271"},{"key":"332_CR7","doi-asserted-by":"crossref","unstructured":"Tsoumakas, G., Katakis, I.: Multi-label classification: an overview. In: Data Warehousing and Mining: Concepts, Methodologies, Tools, and Applications, pp. 64\u201374 (2008)","DOI":"10.4018\/978-1-59904-951-9.ch006"},{"key":"332_CR8","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1007\/s10994-011-5256-5","volume":"85","author":"J Read","year":"2011","unstructured":"Read, J., Pfahringer, B., Holmes, G., Frank, E.: Classifier chains for multi-label classification. Mach. Learn. 85, 333\u2013359 (2011)","journal-title":"Mach. Learn."},{"key":"332_CR9","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1016\/j.neucom.2014.08.091","volume":"163","author":"F Charte","year":"2015","unstructured":"Charte, F., Rivera, A.J., Del Jesus, M.J., Herrera, F.: Addressing imbalance in multilabel classification: measures and random resampling algorithms. Neurocomputing 163, 3\u201316 (2015)","journal-title":"Neurocomputing"},{"key":"332_CR10","doi-asserted-by":"publisher","first-page":"107687","DOI":"10.1016\/j.asoc.2021.107687","volume":"111","author":"I Singh","year":"2021","unstructured":"Singh, I., Kumar, N., Srinivasa, K., Maini, S., Ahuja, U., Jain, S.: A multi-level classification and modified PSO clustering based ensemble approach for credit scoring. Appl. Soft Comput. 111, 107687 (2021)","journal-title":"Appl. Soft Comput."},{"issue":"1","key":"332_CR11","doi-asserted-by":"publisher","first-page":"21631","DOI":"10.1038\/s41598-025-05791-7","volume":"15","author":"SF Taskiran","year":"2025","unstructured":"Taskiran, S.F., Turkoglu, B., Kaya, E., Asuroglu, T.: A comprehensive evaluation of oversampling techniques for enhancing text classification performance. Sci. Rep. 15(1), 21631 (2025)","journal-title":"Sci. Rep."},{"key":"332_CR12","doi-asserted-by":"crossref","unstructured":"Bari, H.: Contextual sentence embedding using base difference procedure (BDP) vectorization. In: 2025 IEEE International Students\u2019 Conference on Electrical, Electronics and Computer Science (SCEECS), pp. 1\u20136. IEEE (2025)","DOI":"10.1109\/SCEECS64059.2025.10940513"},{"key":"332_CR13","unstructured":"Amini, S.: Transforming dementia diagnosis and prognosis through AI. PhD thesis, Boston University (2025)"},{"key":"332_CR14","doi-asserted-by":"crossref","unstructured":"Litoriya, A., Kumar, S., Behera, A.K., Alsamhi, S.H.: DistilBERT meets diagnosis: multi-class disease classification from noisy medical transcriptions. In: 2025 5th International Conference on Emerging Smart Technologies and Applications (eSmarTA), pp. 1\u20138. IEEE (2025)","DOI":"10.1109\/eSmarTA66764.2025.11132131"},{"key":"332_CR15","doi-asserted-by":"crossref","unstructured":"Comito, C., Forestiero, A., Macr\u00ec, D., Metlichin, E., Giusti, G.D., Ramacciati, N.: Comparative analysis of ai algorithms on real medical data for chronic pain detection. International Journal of Medical Informatics, 106002 (2025)","DOI":"10.1016\/j.ijmedinf.2025.106002"},{"issue":"1","key":"332_CR16","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/sdata.2016.35","volume":"3","author":"AE Johnson","year":"2016","unstructured":"Johnson, A.E., Pollard, T.J., Shen, L., Lehman, L.-W.H., Feng, M., Ghassemi, M., Moody, B., Szolovits, P., Anthony Celi, L., Mark, R.G.: MIMIC-III, a freely accessible critical care database. Sci. Data 3(1), 1\u20139 (2016)","journal-title":"Sci. Data"},{"key":"332_CR17","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12859-015-0564-6","volume":"16","author":"G Tsatsaronis","year":"2015","unstructured":"Tsatsaronis, G., Balikas, G., Malakasiotis, P., Partalas, I., Zschunke, M., Alvers, M.R., Weissenborn, D., Krithara, A., Petridis, S., Polychronopoulos, D., et al.: An overview of the BIOASQ large-scale biomedical semantic indexing and question answering competition. BMC Bioinform. 16, 1\u201328 (2015)","journal-title":"BMC Bioinform."},{"key":"332_CR18","unstructured":"Dernoncourt, F., Lee, J.Y.: PubMed 200k RCT: a dataset for sequential sentence classification in medical abstracts (2017). arXiv preprint. arXiv:1710.06071"},{"issue":"7138","key":"332_CR19","doi-asserted-by":"publisher","first-page":"1166","DOI":"10.1136\/bmj.316.7138.1166","volume":"316","author":"D Woods","year":"1998","unstructured":"Woods, D., Trewheellar, K.: Medline and Embase complement each other in literature searches. BMJ: Br. Med. J. 316(7138), 1166 (1998)","journal-title":"BMJ: Br. Med. J."},{"key":"332_CR20","doi-asserted-by":"publisher","first-page":"61","DOI":"10.1016\/j.ejca.2018.07.137","volume":"103","author":"E Paillaud","year":"2018","unstructured":"Paillaud, E., Soubeyran, P., Caillet, P., Cudennec, T., Brain, E., Terret, C., Etchepare, F., Mourey, L., Aparicio, T., Pamoukdjian, F., et al.: Multidisciplinary development of the geriatric core dataset for clinical research in older patients with cancer: a French initiative with international survey. Eur. J. Cancer 103, 61\u201368 (2018)","journal-title":"Eur. J. Cancer"},{"issue":"4","key":"332_CR21","first-page":"215","volume":"3","author":"HL Gope","year":"2014","unstructured":"Gope, H.L., Das, P.K., Islam, M.J., Seddiqui, M.H.: Medical document classification from OHSUMED dataset. IJCSN Int. J. Comput. Sci. Netw. 3(4), 215\u2013219 (2014)","journal-title":"IJCSN Int. J. Comput. Sci. Netw."},{"issue":"1","key":"332_CR22","doi-asserted-by":"publisher","first-page":"909","DOI":"10.1038\/s41597-023-02814-8","volume":"10","author":"Z Zhao","year":"2023","unstructured":"Zhao, Z., Jin, Q., Chen, F., Peng, T., Yu, S.: A large-scale dataset of patient summaries for retrieval-based clinical decision support systems. Sci. Data 10(1), 909 (2023)","journal-title":"Sci. Data"},{"key":"332_CR23","unstructured":"Wang, L.L., Lo, K., Chandrasekhar, Y., Reas, R., Yang, J., Burdick, D., Eide, D., Funk, K., Katsis, Y., Kinney, R.M., Li, Y., Liu, Z., Merrill, W., Mooney, P., Murdick, D.A., Rishi, D., Sheehan, J., Shen, Z., Stilson, B., Wade, A.D., Wang, K., Wang, N.X.R., Wilhelm, C., Xie, B., Raymond, D.M., Weld, D.S., Etzioni, O., Kohlmeier, S.: CORD-19: the COVID-19 open research dataset. In: Verspoor, K., Cohen, K.B., Dredze, M., Ferrara, E., May, J., Munro, R., Paris, C., Wallace, B. (eds.) Proceedings of the 1st Workshop on NLP for COVID-19 at ACL 2020. Association for Computational Linguistics, Online (2020). https:\/\/aclanthology.org\/2020.nlpcovid19-acl.1\/"}],"container-title":["Iran Journal of Computer Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42044-025-00332-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s42044-025-00332-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42044-025-00332-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,10]],"date-time":"2025-12-10T09:10:22Z","timestamp":1765357822000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s42044-025-00332-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,26]]},"references-count":23,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2025,12]]}},"alternative-id":["332"],"URL":"https:\/\/doi.org\/10.1007\/s42044-025-00332-x","relation":{},"ISSN":["2520-8438","2520-8446"],"issn-type":[{"type":"print","value":"2520-8438"},{"type":"electronic","value":"2520-8446"}],"subject":[],"published":{"date-parts":[[2025,9,26]]},"assertion":[{"value":"11 April 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 September 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 September 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"All authors who contributed provided their consent for publication.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}}]}}