{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,20]],"date-time":"2026-04-20T10:31:20Z","timestamp":1776681080278,"version":"3.51.2"},"publisher-location":"Cham","reference-count":47,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030916077","type":"print"},{"value":"9783030916084","type":"electronic"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-91608-4_20","type":"book-chapter","created":{"date-parts":[[2021,11,23]],"date-time":"2021-11-23T20:05:55Z","timestamp":1637697955000},"page":"196-203","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["New Arabic Medical Dataset for Diseases Classification"],"prefix":"10.1007","author":[{"given":"Jaafar","family":"Hammoud","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Aleksandra","family":"Vatian","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Natalia","family":"Dobrenko","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nikolai","family":"Vedernikov","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Anatoly","family":"Shalyto","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Natalia","family":"Gusarova","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,11,23]]},"reference":[{"key":"20_CR1","unstructured":"Li, Q., et al.: A text classification survey: from shallow to deep learning. arXiv preprint arXiv:2008.00364 (2020)"},{"issue":"3","key":"20_CR2","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1186\/s12911-019-0781-4","volume":"19","author":"L Yao","year":"2019","unstructured":"Yao, L., Mao, C., Luo, Y.: Clinical text classification with rule-based features and knowledge-guided convolutional neural networks. BMC Med. Inform. Decis. Mak. 19(3), 71 (2019)","journal-title":"BMC Med. Inform. Decis. Mak."},{"key":"20_CR3","doi-asserted-by":"publisher","unstructured":"Suzdaltseva, M., et al.: De-identification of medical information for forming multimodal datasets to train neural networks. In: Proceedings of the 7th International Conference on Information and Communication Technologies for Ageing Well and E-Health, pp. 163\u2013170 (2021). https:\/\/doi.org\/10.5220\/0010406001630170","DOI":"10.5220\/0010406001630170"},{"key":"20_CR4","unstructured":"Hammoud, J., Dobrenko, N., Gusarova, N.: Named entity recognition and information extraction for Arabic medical text. In: Multi Conference on Computer Science and Information Systems, MCCSIS 2020-Proceedings of the International Conference on e-Health, pp. 121\u2013127 (2020)"},{"key":"20_CR5","doi-asserted-by":"crossref","unstructured":"Alalyani, N., Marie-Sainte, S.L.: NADA: new Arabic dataset for text classification. Int. J. Adv. Comput. Sci. Appl. 9(9) (2018)","DOI":"10.14569\/IJACSA.2018.090928"},{"issue":"1\u20134","key":"20_CR6","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1007\/s13042-010-0001-0","volume":"1","author":"Y Zhang","year":"2010","unstructured":"Zhang, Y., Jin, R., Zhou, Z.H.: Understanding bag-of-words model: a statistical framework. Int. J. Mach. Learn. Cybern. 1(1\u20134), 43\u201352 (2010)","journal-title":"Int. J. Mach. Learn. Cybern."},{"key":"20_CR7","doi-asserted-by":"crossref","unstructured":"Pennington, J., Socher, R., Manning, C.D.: Glove: global vectors for word representation. In: Proceedings of the 2014 conference on empirical methods in natural language processing (EMNLP), pp. 1532\u20131543, Oct 2014","DOI":"10.3115\/v1\/D14-1162"},{"key":"20_CR8","unstructured":"Mikolov, T., Chen, K., Corrado, G., Dean, J.: Efficient estimation of word representations in vector space. arXiv preprint arXiv:1301.3781 (2013)"},{"key":"20_CR9","unstructured":"Cavnar, W.B., Trenkle, J.M.: N-gram-based text categorization. In: Proceedings of SDAIR-94, 3rd Annual Symposium on Document Analysis and Information Retrieval, vol. 161175, Apr 1994"},{"key":"20_CR10","doi-asserted-by":"crossref","unstructured":"Term frequency by inverse document frequency. In: Encyclopedia of Database Systems, p. 3035 (2009)","DOI":"10.1007\/978-0-387-39940-9_3784"},{"key":"20_CR11","doi-asserted-by":"crossref","unstructured":"Zhang, M.L., Zhang, K.: Multi-label learning by exploiting label dependency. In: Proceedings of the 16th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 999\u20131008, July 2010","DOI":"10.1145\/1835804.1835930"},{"key":"20_CR12","doi-asserted-by":"crossref","unstructured":"van den Bosch, A.: Hidden Markov models. In: Encyclopedia of Machine Learning and Data Mining, pp. 609\u2013611 (2017)","DOI":"10.1007\/978-1-4899-7687-1_124"},{"issue":"3","key":"20_CR13","doi-asserted-by":"publisher","first-page":"404","DOI":"10.1145\/321075.321084","volume":"8","author":"ME Maron","year":"1961","unstructured":"Maron, M.E.: Automatic indexing: an experimental inquiry. J. ACM (JACM) 8(3), 404\u2013417 (1961)","journal-title":"J. ACM (JACM)"},{"key":"20_CR14","doi-asserted-by":"crossref","unstructured":"O'Donnell, M.: Cataloging and classification: an introduction. Lois Mai Chan. Lanham, MD: Scarecrow Press, p. 580, 2007. ISBN 0-8108-6000-7. Tech. Serv. Q. 26(1), 86\u201387 (2008)","DOI":"10.1080\/07317130802225670"},{"issue":"1","key":"20_CR15","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1109\/TIT.1967.1053964","volume":"13","author":"T Cover","year":"1967","unstructured":"Cover, T., Hart, P.: Nearest neighbor pattern classification. IEEE Trans. Inf. Theory 13(1), 21\u201327 (1967)","journal-title":"IEEE Trans. Inf. Theory"},{"issue":"1","key":"20_CR16","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13326-016-0073-1","volume":"7","author":"K Dram\u00e9","year":"2016","unstructured":"Dram\u00e9, K., Mougin, F., Diallo, G.: Large scale biomedical texts classification: a kNN and an ESA-based approaches. J. Biomed. Semant. 7(1), 1\u201312 (2016)","journal-title":"J. Biomed. Semant."},{"key":"20_CR17","doi-asserted-by":"crossref","unstructured":"Cortes, C., Vapnik, V.: Support-vector Networks Machine learning, vol. 20, pp. 237\u2013297. Kluwer Academic Publisher, Boston, MA (1995)","DOI":"10.1007\/BF00994018"},{"issue":"5","key":"20_CR18","doi-asserted-by":"publisher","first-page":"850","DOI":"10.1136\/amiajnl-2013-002411","volume":"21","author":"DDA Bui","year":"2014","unstructured":"Bui, D.D.A., Zeng-Treitler, Q.: Learning regular expressions for clinical text classification. J. Am. Med. Inform. Assoc. 21(5), 850\u2013857 (2014)","journal-title":"J. Am. Med. Inform. Assoc."},{"issue":"1","key":"20_CR19","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12911-019-0825-9","volume":"19","author":"CC Chern","year":"2019","unstructured":"Chern, C.C., Chen, Y.J., Hsiao, B.: Decision tree\u2013based classifier in providing telehealth service. BMC Med. Inform. Decis. Mak. 19(1), 1\u201315 (2019)","journal-title":"BMC Med. Inform. Decis. Mak."},{"issue":"3","key":"20_CR20","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3439726","volume":"54","author":"S Minaee","year":"2021","unstructured":"Minaee, S., Kalchbrenner, N., Cambria, E., Nikzad, N., Chenaghlu, M., Gao, J.: Deep learning\u2013based text classification: a comprehensive review. ACM Comput. Surv. (CSUR) 54(3), 1\u201340 (2021)","journal-title":"ACM Comput. Surv. (CSUR)"},{"key":"20_CR21","doi-asserted-by":"crossref","unstructured":"Tai, K.S., Socher, R., Manning, C.D.: Improved semantic representations from tree-structured long short-term memory networks. arXiv preprint arXiv:1503.00075 (2015)","DOI":"10.3115\/v1\/P15-1150"},{"key":"20_CR22","doi-asserted-by":"crossref","unstructured":"Liu, P., Qiu, X., Chen, X., Wu, S., Huang, X.J.: Multi-timescale long short-term memory neural network for modelling sentences and documents. In: Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing, pp. 2326\u20132335, Sept 2015","DOI":"10.18653\/v1\/D15-1280"},{"key":"20_CR23","unstructured":"Zhou, P., Qi, Z., Zheng, S., Xu, J., Bao, H., Xu, B.: Text classification improved by integrating bidirectional LSTM with two-dimensional max pooling. arXiv preprint arXiv:1611.06639 (2016)"},{"key":"20_CR24","doi-asserted-by":"crossref","unstructured":"Conneau, A., Schwenk, H., Barrault, L., Lecun, Y.: Very deep convolutional networks for text classification. arXiv preprint arXiv:1606.01781 (2016)","DOI":"10.18653\/v1\/E17-1104"},{"key":"20_CR25","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556 (2014)"},{"key":"20_CR26","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"20_CR27","doi-asserted-by":"crossref","unstructured":"Mou, L., et al.: Natural language inference by tree-based convolution and heuristic matching. arXiv preprint arXiv:1512.08422 (2015)","DOI":"10.18653\/v1\/P16-2022"},{"key":"20_CR28","doi-asserted-by":"crossref","unstructured":"Karimi, S., Dai, X., Hassanzadeh, H., Nguyen, A.: Automatic diagnosis coding of radiology reports: a comparison of deep learning and conventional classification methods. In: BioNLP 2017, pp. 328\u2013332, Aug 2017","DOI":"10.18653\/v1\/W17-2342"},{"issue":"12","key":"20_CR29","doi-asserted-by":"publisher","first-page":"i70","DOI":"10.1093\/bioinformatics\/btw294","volume":"32","author":"S Peng","year":"2016","unstructured":"Peng, S., You, R., Wang, H., Zhai, C., Mamitsuka, H., Zhu, S.: DeepMeSH: deep semantic representation for improving large-scale MeSH indexing. Bioinformatics 32(12), i70\u2013i79 (2016)","journal-title":"Bioinformatics"},{"key":"20_CR30","doi-asserted-by":"crossref","unstructured":"Rios, A., Kavuluru, R.: Convolutional neural networks for biomedical text classification: application in indexing biomedical articles. In: Proceedings of the 6th ACM Conference on Bioinformatics, Computational Biology and Health Informatics, pp. 258\u2013267, Sept 2015","DOI":"10.1145\/2808719.2808746"},{"key":"20_CR31","first-page":"246","volume":"235","author":"M Hughes","year":"2017","unstructured":"Hughes, M., Li, I., Kotoulas, S., Suzumura, T.: Medical text classification using convolutional neural networks. Stud. Health Technol. Inform. 235, 246\u2013250 (2017)","journal-title":"Stud. Health Technol. Inform."},{"key":"20_CR32","unstructured":"Vaswani, A., et al.: Attention is all you need. arXiv preprint arXiv:1706.03762 (2017)"},{"key":"20_CR33","unstructured":"Devlin, J., Chang, M.W., Lee, K., Toutanova, K.: Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805 (2018)"},{"key":"20_CR34","unstructured":"Hammoud, J., Eisab, A., Dobrenkoa, N., Gusarovaa, N.: Using a new nonlinear gradient method for solving large scale convex optimization problems with an application on Arabic medical text. arXiv preprint arXiv:2106.04383 (2021)"},{"key":"20_CR35","unstructured":"Radford, A., Narasimhan, K., Salimans, T., Sutskever, I.: Improving language understanding by generative pre-training (2018)"},{"issue":"8","key":"20_CR36","first-page":"9","volume":"1","author":"A Radford","year":"2019","unstructured":"Radford, A., Wu, J., Child, R., Luan, D., Amodei, D., Sutskever, I.: Language models are unsupervised multitask learners. OpenAI Blog 1(8), 9 (2019)","journal-title":"OpenAI Blog"},{"key":"20_CR37","unstructured":"Liu, Y., et al.: Roberta: A robustly optimized BERT pretraining approach. arXiv preprint arXiv:1907.11692 (2019)"},{"key":"20_CR38","unstructured":"Lan, Z., Chen, M., Goodman, S., Gimpel, K., Sharma, P., Soricut, R.: Albert: a lite bert for self-supervised learning of language representations. arXiv preprint arXiv:1909.11942 (2019)"},{"issue":"3","key":"20_CR39","first-page":"320","volume":"32","author":"SL Marie-Sainte","year":"2020","unstructured":"Marie-Sainte, S.L., Alalyani, N.: Firefly algorithm based feature selection for Arabic text classification. J. King Saud Univ. Comput. Inf. Sci. 32(3), 320\u2013328 (2020)","journal-title":"J. King Saud Univ. Comput. Inf. Sci."},{"key":"20_CR40","unstructured":"Saad, M.K., Ashour, W.M.: OSAC: open source Arabic corpora. In: 6th ArchEng International Symposiums, EEECS, vol. 10 (2010)"},{"key":"20_CR41","doi-asserted-by":"crossref","unstructured":"Zhu, Y., et al.: Aligning books and movies: towards story-like visual explanations by watching movies and reading books. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 19\u201327 (2015)","DOI":"10.1109\/ICCV.2015.11"},{"key":"20_CR42","unstructured":"Antoun, W., Baly, F., Hajj, H.: Arabert: transformer-based model for Arabic language understanding. arXiv preprint arXiv:2003.00104 (2020)"},{"key":"20_CR43","unstructured":"El-Khair, I.A.: 1.5 billion words Arabic corpus. arXiv preprint arXiv:1611.04033 (2016)"},{"key":"20_CR44","doi-asserted-by":"crossref","unstructured":"Zeroual, I., Goldhahn, D., Eckart, T., Lakhouaja, A.: OSIAN: Open source international Arabic news corpus-preparation and integration into the CLARIN-infrastructure. In: Proceedings of the Fourth Arabic Natural Language Processing Workshop, pp. 175\u2013182, Aug 2019","DOI":"10.18653\/v1\/W19-4619"},{"key":"20_CR45","doi-asserted-by":"crossref","unstructured":"Boudjellal, N., et al.: ABioNER: a BERT-based model for Arabic biomedical named-entity recognition. Complexity (2021)","DOI":"10.1155\/2021\/6633213"},{"key":"20_CR46","unstructured":"WHO EMRO: EMHJ home. East. Mediterr. Health J. 27 (2021). http:\/\/www.emro.who.int\/emhjournal\/eastern-mediterranean-health-journal\/home.html"},{"key":"20_CR47","unstructured":"Adhikari, A., Ram, A., Tang, R., Lin, J.: Docbert: Bert for document classification. arXiv preprint arXiv:1904.08398 (2019)"}],"container-title":["Lecture Notes in Computer Science","Intelligent Data Engineering and Automated Learning \u2013 IDEAL 2021"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-91608-4_20","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,12]],"date-time":"2024-03-12T15:48:53Z","timestamp":1710258533000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-91608-4_20"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030916077","9783030916084"],"references-count":47,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-91608-4_20","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"23 November 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"IDEAL","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Intelligent Data Engineering and Automated Learning","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Manchester","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"United Kingdom","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"25 November 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 November 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ideal2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/ideal-conf.com\/ideal2021","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"EasyChair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"85","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"61","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"72% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2.8","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2.3","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"The conference took place virtually due to the COVID-19 pandemic","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}