{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T12:43:34Z","timestamp":1740141814848,"version":"3.37.3"},"reference-count":89,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2023,8,5]],"date-time":"2023-08-05T00:00:00Z","timestamp":1691193600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,8,5]],"date-time":"2023-08-05T00:00:00Z","timestamp":1691193600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["IJDAR"],"published-print":{"date-parts":[[2024,3]]},"DOI":"10.1007\/s10032-023-00446-7","type":"journal-article","created":{"date-parts":[[2023,8,5]],"date-time":"2023-08-05T11:01:36Z","timestamp":1691233296000},"page":"73-95","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["A multifaceted evaluation of representation of graphemes for practically effective Bangla OCR"],"prefix":"10.1007","volume":"27","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9525-7196","authenticated-orcid":false,"given":"Koushik","family":"Roy","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1481-6994","authenticated-orcid":false,"given":"Md Sazzad","family":"Hossain","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1646-7804","authenticated-orcid":false,"given":"Pritom Kumar","family":"Saha","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0357-7636","authenticated-orcid":false,"given":"Shadman","family":"Rohan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9978-6442","authenticated-orcid":false,"given":"Imranul","family":"Ashrafi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3830-8759","authenticated-orcid":false,"given":"Ifty Mohammad","family":"Rezwan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8670-7124","authenticated-orcid":false,"given":"Fuad","family":"Rahman","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0447-4217","authenticated-orcid":false,"given":"B. M. Mainul","family":"Hossain","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5983-6775","authenticated-orcid":false,"given":"Ahmedul","family":"Kabir","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7661-3570","authenticated-orcid":false,"given":"Nabeel","family":"Mohammed","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,8,5]]},"reference":[{"issue":"1","key":"446_CR1","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1109\/MASSP.1986.1165342","volume":"3","author":"L Rabiner","year":"1986","unstructured":"Rabiner, L., Juang, B.: An introduction to hidden Markov models. IEEE ASSP Mag. 3(1), 4\u201316 (1986)","journal-title":"IEEE ASSP Mag."},{"key":"446_CR2","series-title":"Wiley Series in Probability and Statistics","doi-asserted-by":"publisher","DOI":"10.1002\/9780470035948","volume-title":"Bayesian Statistical Modelling","author":"P Congdon","year":"2006","unstructured":"Congdon, P.: Bayesian Statistical Modelling. Wiley Series in Probability and Statistics, Wiley (2006). https:\/\/doi.org\/10.1002\/9780470035948"},{"key":"446_CR3","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556 (2014)"},{"key":"446_CR4","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"issue":"12","key":"446_CR5","doi-asserted-by":"publisher","first-page":"2552","DOI":"10.1109\/TPAMI.2014.2339814","volume":"36","author":"J Almaz\u00e1n","year":"2014","unstructured":"Almaz\u00e1n, J., Gordo, A., Forn\u00e9s, A., Valveny, E.: Word spotting and recognition with embedded attributes. IEEE Trans. Pattern Anal. Mach. Intell. 36(12), 2552\u20132566 (2014)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"446_CR6","unstructured":"Jaderberg, M., Simonyan, K., Vedaldi, A., Zisserman, A.: Synthetic data and artificial neural networks for natural scene text recognition. arXiv preprint arXiv:1406.2227 (2014)"},{"key":"446_CR7","doi-asserted-by":"crossref","unstructured":"Feng, X., Yao, H., Zhang, S.: Focal CTC loss for Chinese optical character recognition on unbalanced datasets. Complexity 2019 (2019)","DOI":"10.1155\/2019\/9345861"},{"key":"446_CR8","unstructured":"Kang, L., Riba, P., Rusi\u00f1ol, M., Forn\u00e9s, A., Villegas, M.: Pay attention to what you read: non-recurrent handwritten text-line recognition. arXiv preprint arXiv:2005.13044 (2020)"},{"issue":"1","key":"446_CR9","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11263-015-0823-z","volume":"116","author":"M Jaderberg","year":"2016","unstructured":"Jaderberg, M., Simonyan, K., Vedaldi, A., Zisserman, A.: Reading text in the wild with convolutional neural networks. Int. J. Comput. Vis. 116(1), 1\u201320 (2016). https:\/\/doi.org\/10.1007\/s11263-015-0823-z","journal-title":"Int. J. Comput. Vis."},{"issue":"11","key":"446_CR10","doi-asserted-by":"publisher","first-page":"2298","DOI":"10.1109\/TPAMI.2016.2646371","volume":"39","author":"B Shi","year":"2016","unstructured":"Shi, B., Bai, X., Yao, C.: An end-to-end trainable neural network for image-based sequence recognition and its application to scene text recognition. IEEE Trans. Pattern Anal. Mach. Intell. 39(11), 2298\u20132304 (2016)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"446_CR11","doi-asserted-by":"crossref","unstructured":"Hu, W., Cai, X., Hou, J., Yi, S., Lin, Z.: GTC: Guided training of CTC towards efficient and accurate scene text recognition. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 34, pp. 11005\u201311012 (2020)","DOI":"10.1609\/aaai.v34i07.6735"},{"key":"446_CR12","doi-asserted-by":"publisher","first-page":"149","DOI":"10.1007\/978-981-16-1092-9_13","volume-title":"Comput. Vis. Image Process.","author":"MJR Rifat","year":"2021","unstructured":"Rifat, M.J.R., Banik, M., Hasan, N., Nahar, J., Rahman, F.: A novel machine annotated balanced Bangla OCR corpus. In: Singh, S.K., Roy, P., Raman, B., Nagabhushan, P. (eds.) Comput. Vis. Image Process., pp. 149\u2013160. Springer, Singapore (2021)"},{"issue":"3","key":"446_CR13","doi-asserted-by":"publisher","first-page":"431","DOI":"10.1007\/s10044-011-0237-7","volume":"16","author":"M Anthimopoulos","year":"2013","unstructured":"Anthimopoulos, M., Gatos, B., Pratikakis, I.: Detection of artificial and scene text in images and video frames. Pattern Anal. Appl. 16(3), 431\u2013446 (2013)","journal-title":"Pattern Anal. Appl."},{"key":"446_CR14","doi-asserted-by":"crossref","unstructured":"Chen, H., Tsai, S.S., Schroth, G., Chen, D.M., Grzeszczuk, R., Girod, B.: Robust text detection in natural images with edge-enhanced maximally stable extremal regions. In: 2011 18th IEEE International Conference on Image Processing, pp. 2609\u20132612 (2011). IEEE","DOI":"10.1109\/ICIP.2011.6116200"},{"key":"446_CR15","doi-asserted-by":"crossref","unstructured":"Epshtein, B., Ofek, E., Wexler, Y.: Detecting text in natural scenes with stroke width transform. In: 2010 IEEE Computer Society Conference on Computer Vision and Pattern Recognition, pp. 2963\u20132970 (2010). IEEE","DOI":"10.1109\/CVPR.2010.5540041"},{"key":"446_CR16","doi-asserted-by":"crossref","unstructured":"Huang, W., Qiao, Y., Tang, X.: Robust scene text detection with convolution neural network induced MSER trees. In: European Conference on Computer Vision, pp. 497\u2013511 (2014). Springer","DOI":"10.1007\/978-3-319-10593-2_33"},{"key":"446_CR17","unstructured":"Alsharif, O., Pineau, J.: End-to-end text recognition with hybrid hmm maxout models. arXiv preprint arXiv:1310.1811 (2013)"},{"key":"446_CR18","doi-asserted-by":"crossref","unstructured":"Gordo, A.: Supervised mid-level features for word image representation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2956\u20132964 (2015)","DOI":"10.1109\/CVPR.2015.7298914"},{"key":"446_CR19","doi-asserted-by":"crossref","unstructured":"Neumann, L., Matas, J.: A method for text localization and recognition in real-world images. In: Asian Conference on Computer Vision, pp. 770\u2013783 (2010). Springer","DOI":"10.1007\/978-3-642-19318-7_60"},{"key":"446_CR20","doi-asserted-by":"crossref","unstructured":"Mishra, A., Alahari, K., Jawahar, C.: Image retrieval using textual cues. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 3040\u20133047 (2013)","DOI":"10.1109\/ICCV.2013.378"},{"key":"446_CR21","doi-asserted-by":"crossref","unstructured":"Smith, R.: An overview of the Tesseract OCR engine. In: Ninth International Conference on Document Analysis and Recognition (ICDAR 2007), vol. 2, pp. 629\u2013633 (2007). IEEE","DOI":"10.1109\/ICDAR.2007.4376991"},{"key":"446_CR22","doi-asserted-by":"crossref","unstructured":"Shi, B., Wang, X., Lyu, P., Yao, C., Bai, X.: Robust scene text recognition with automatic rectification. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4168\u20134176 (2016)","DOI":"10.1109\/CVPR.2016.452"},{"issue":"8","key":"446_CR23","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J.: Long short-term memory. Neural Comput. 9(8), 1735\u20131780 (1997)","journal-title":"Neural Comput."},{"key":"446_CR24","doi-asserted-by":"crossref","unstructured":"Karatzas, D., Shafait, F., Uchida, S., Iwamura, M., i Bigorda, L.G., Mestre, S.R., Mas, J., Mota, D.F., Almazan, J.A., De\u00a0Las\u00a0Heras, L.P.: ICDAR 2013 robust reading competition. In: 2013 12th International Conference on Document Analysis and Recognition, pp. 1484\u20131493 (2013). IEEE","DOI":"10.1109\/ICDAR.2013.221"},{"key":"446_CR25","doi-asserted-by":"crossref","unstructured":"Baek, J., Kim, G., Lee, J., Park, S., Han, D., Yun, S., Oh, S.J., Lee, H.: What is wrong with scene text recognition model comparisons? Dataset and model analysis. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV) (2019)","DOI":"10.1109\/ICCV.2019.00481"},{"key":"446_CR26","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A.N., Kaiser, L., Polosukhin, I.: Attention is all you need. arXiv preprint arXiv:1706.03762 (2017)"},{"key":"446_CR27","doi-asserted-by":"crossref","unstructured":"Graves, A., Fern\u00e1ndez, S., Gomez, F., Schmidhuber, J.: Connectionist temporal classification: labelling unsegmented sequence data with recurrent neural networks. In: Proceedings of the 23rd International Conference on Machine Learning, pp. 369\u2013376 (2006)","DOI":"10.1145\/1143844.1143891"},{"issue":"9","key":"446_CR28","doi-asserted-by":"publisher","first-page":"2035","DOI":"10.1109\/TPAMI.2018.2848939","volume":"41","author":"B Shi","year":"2019","unstructured":"Shi, B., Yang, M., Wang, X., Lyu, P., Yao, C., Bai, X.: ASTER: an attentional scene text recognizer with flexible rectification. IEEE Trans. Pattern Anal. Mach. Intell. 41(9), 2035\u20132048 (2019). https:\/\/doi.org\/10.1109\/TPAMI.2018.2848939","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"446_CR29","doi-asserted-by":"publisher","unstructured":"Cheng, Z., Bai, F., Xu, Y., Zheng, G., Pu, S., Zhou, S.: Focusing attention: towards accurate text recognition in natural images. In: 2017 IEEE International Conference on Computer Vision (ICCV), pp. 5086\u20135094 (2017). https:\/\/doi.org\/10.1109\/ICCV.2017.543","DOI":"10.1109\/ICCV.2017.543"},{"key":"446_CR30","doi-asserted-by":"publisher","unstructured":"Litman, R., Anschel, O., Tsiper, S., Litman, R., Mazor, S., Manmatha, R.: Scatter: selective context attentional scene text recognizer. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 11959\u201311969 (2020). https:\/\/doi.org\/10.1109\/CVPR42600.2020.01198","DOI":"10.1109\/CVPR42600.2020.01198"},{"key":"446_CR31","doi-asserted-by":"crossref","unstructured":"Yu, D., Li, X., Zhang, C., Liu, T., Han, J., Liu, J., Ding, E.: Towards accurate scene text recognition with semantic reasoning networks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12113\u201312122 (2020)","DOI":"10.1109\/CVPR42600.2020.01213"},{"key":"446_CR32","doi-asserted-by":"crossref","unstructured":"Karatzas, D., Gomez-Bigorda, L., Nicolaou, A., Ghosh, S., Bagdanov, A., Iwamura, M., Matas, J., Neumann, L., Chandrasekhar, V.R., Lu, S., et al.: ICDAR 2015 competition on robust reading. In: 2015 13th International Conference on Document Analysis and Recognition (ICDAR), pp. 1156\u20131160 (2015). IEEE","DOI":"10.1109\/ICDAR.2015.7333942"},{"key":"446_CR33","unstructured":"Feng, X., Yao, H., Qi, Y., Zhang, J., Zhang, S.: Scene text recognition via transformer. arXiv preprint arXiv:2003.08077 (2020)"},{"key":"446_CR34","doi-asserted-by":"crossref","unstructured":"Atienza, R.: Vision transformer for fast and efficient scene text recognition. In: Document Analysis and Recognition\u2013ICDAR 2021: 16th International Conference, Lausanne, Switzerland, September 5\u201310, 2021, Proceedings, Part I, vol. 16, pp. 319\u2013334 (2021). Springer","DOI":"10.1007\/978-3-030-86549-8_21"},{"key":"446_CR35","unstructured":"Wu, J., Peng, Y., Zhang, S., Qi, W., Zhang, J.: Masked vision-language transformers for scene text recognition. arXiv preprint arXiv:2211.04785 (2022)"},{"key":"446_CR36","doi-asserted-by":"crossref","unstructured":"Wang, P., Da, C., Yao, C.: Multi-granularity prediction for scene text recognition. In: Computer Vision\u2014ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23\u201327, 2022, Proceedings, Part XXVIII, pp. 339\u2013355 (2022). Springer","DOI":"10.1007\/978-3-031-19815-1_20"},{"key":"446_CR37","doi-asserted-by":"crossref","unstructured":"Xie, X., Fu, L., Zhang, Z., Wang, Z., Bai, X.: Toward understanding wordart: corner-guided transformer for scene text recognition. In: Computer Vision\u2013ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23\u201327, 2022, Proceedings, Part XXVIII, pp. 303\u2013321 (2022). Springer","DOI":"10.1007\/978-3-031-19815-1_18"},{"key":"446_CR38","unstructured":"Aberdam, A., Ganz, R., Mazor, S., Litman, R.: Multimodal semi-supervised learning for text recognition. arXiv preprint arXiv:2205.03873 (2022)"},{"key":"446_CR39","doi-asserted-by":"crossref","unstructured":"Yang, M., Liao, M., Lu, P., Wang, J., Zhu, S., Luo, H., Tian, Q., Bai, X.: Reading and writing: discriminative and generative modeling for self-supervised text recognition. In: Proceedings of the 30th ACM International Conference on Multimedia, pp. 4214\u20134223 (2022)","DOI":"10.1145\/3503161.3547784"},{"key":"446_CR40","doi-asserted-by":"crossref","unstructured":"Chu, X., Wang, Y.: IterVM: iterative vision modeling module for scene text recognition. In: 2022 26th International Conference on Pattern Recognition (ICPR), pp. 1393\u20131399 (2022). IEEE","DOI":"10.1109\/ICPR56361.2022.9956029"},{"key":"446_CR41","doi-asserted-by":"crossref","unstructured":"Du, Y., Chen, Z., Jia, C., Yin, X., Zheng, T., Li, C., Du, Y., Jiang, Y.-G.: Svtr: scene text recognition with a single visual model. arXiv preprint arXiv:2205.00159 (2022)","DOI":"10.24963\/ijcai.2022\/124"},{"key":"446_CR42","doi-asserted-by":"crossref","unstructured":"Zheng, C., Li, H., Rhee, S.-M., Han, S., Han, J.-J., Wang, P.: Pushing the performance limit of scene text recognizer without human annotation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 14116\u201314125 (2022)","DOI":"10.1109\/CVPR52688.2022.01372"},{"key":"446_CR43","doi-asserted-by":"crossref","unstructured":"Chammas, E., Mokbel, C., Likforman-Sulem, L.: Handwriting recognition of historical documents with few labeled data. In: 2018 13th IAPR International Workshop on Document Analysis Systems (DAS), pp. 43\u201348 (2018). IEEE","DOI":"10.1109\/DAS.2018.15"},{"key":"446_CR44","doi-asserted-by":"crossref","unstructured":"Ki\u0161\u0161, M., Hradi\u0161, M., Bene\u0161, K., Buchal, P., Kula, M.: SoftCTC\u2014Semi-Supervised Learning for Text Recognition using Soft Pseudo-labels. arXiv (2022). arXiv:2212.02135","DOI":"10.1007\/s10032-023-00452-9"},{"key":"446_CR45","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107482","volume":"108","author":"M Yousef","year":"2020","unstructured":"Yousef, M., Hussain, K.F., Mohammed, U.S.: Accurate, data-efficient, unconstrained text recognition with convolutional neural networks. Pattern Recogn. 108, 107482 (2020). https:\/\/doi.org\/10.1016\/j.patcog.2020.107482","journal-title":"Pattern Recogn."},{"key":"446_CR46","doi-asserted-by":"publisher","unstructured":"Maillette\u00a0de Buy\u00a0Wenniger, G., Schomaker, L., Way, A.: No padding please: efficient neural handwriting recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR), pp. 355\u2013362 (2019). https:\/\/doi.org\/10.1109\/ICDAR.2019.00064","DOI":"10.1109\/ICDAR.2019.00064"},{"key":"446_CR47","doi-asserted-by":"publisher","first-page":"507","DOI":"10.1007\/978-3-031-06555-2_34","volume-title":"Document Analysis Systems","author":"D Kass","year":"2022","unstructured":"Kass, D., Vats, E.: AttentionHTR: handwritten text recognition based on attention encoder\u2013decoder networks. In: Uchida, S., Barney, E., Eglin, V. (eds.) Document Analysis Systems, pp. 507\u2013522. Springer, Cham (2022)"},{"key":"446_CR48","doi-asserted-by":"publisher","unstructured":"Fogel, S., Averbuch-Elor, H., Cohen, S., Mazor, S., Litman, R.: Scrabblegan: Semi-supervised varying length handwritten text generation. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 4323\u20134332 (2020). https:\/\/doi.org\/10.1109\/CVPR42600.2020.00438","DOI":"10.1109\/CVPR42600.2020.00438"},{"key":"446_CR49","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1016\/j.patrec.2022.06.003","volume":"160","author":"MA Souibgui","year":"2022","unstructured":"Souibgui, M.A., Forn\u00e9s, A., Kessentini, Y., Megyesi, B.: Few shots are all you need: a progressive learning approach for low resource handwritten text recognition. Pattern Recogn. Lett. 160, 43\u201349 (2022). https:\/\/doi.org\/10.1016\/j.patrec.2022.06.003","journal-title":"Pattern Recogn. Lett."},{"issue":"4","key":"446_CR50","first-page":"395","volume":"6","author":"A Rahman","year":"1998","unstructured":"Rahman, A., Kaykobad, M.: A complete Bengali OCR: a novel hybrid approach to handwritten Bengali character recognition. J. Comput. Inf. Technol. 6(4), 395\u2013413 (1998)","journal-title":"J. Comput. Inf. Technol."},{"key":"446_CR51","doi-asserted-by":"publisher","unstructured":"Pal, U., Chaudhuri, B.B.: OCR in Bangla: an Indo-Bangladeshi language. In: Proceedings of the 12th IAPR International Conference on Pattern Recognition, Vol. 3\u2014Conference C: Signal Processing (Cat. No.94CH3440-5), vol. 2, pp. 269\u20132732 (1994). https:\/\/doi.org\/10.1109\/ICPR.1994.576917","DOI":"10.1109\/ICPR.1994.576917"},{"issue":"1","key":"446_CR52","first-page":"1","volume":"4","author":"M Sattar","year":"1989","unstructured":"Sattar, M., Rahman, S.: An experimental investigation on Bangla character recognition system. Bangladesh Comput. Soc. J. 4(1), 1\u20134 (1989)","journal-title":"Bangladesh Comput. Soc. J."},{"issue":"14","key":"446_CR53","doi-asserted-by":"publisher","first-page":"1208","DOI":"10.1049\/el:19970848","volume":"33","author":"AFR Rahman","year":"1997","unstructured":"Rahman, A.F.R., Fairhurst, M.: Multi-prototype classification: improved modelling of the variability of handwritten data using statistical clustering algorithms. Electron. Lett. 33(14), 1208\u20131210 (1997)","journal-title":"Electron. Lett."},{"key":"446_CR54","unstructured":"Pal, U.: On the development of an optical character recognition (OCR) system for printed Bangla script. PhD thesis, Indian Statistical Institute, Calcutta (1997)"},{"issue":"5","key":"446_CR55","doi-asserted-by":"publisher","first-page":"531","DOI":"10.1016\/S0031-3203(97)00078-2","volume":"31","author":"B Chaudhuri","year":"1998","unstructured":"Chaudhuri, B., Pal, U.: A complete printed Bangla OCR system. Pattern Recogn. 31(5), 531\u2013549 (1998)","journal-title":"Pattern Recogn."},{"issue":"8","key":"446_CR56","doi-asserted-by":"publisher","first-page":"781","DOI":"10.1016\/S0167-8655(97)00078-0","volume":"18","author":"AFR Rahman","year":"1997","unstructured":"Rahman, A.F.R., Fairhurst, M.C.: A new hybrid approach in combining multiple experts to recognise handwritten numerals. Pattern Recogn. Lett. 18(8), 781\u2013790 (1997)","journal-title":"Pattern Recogn. Lett."},{"issue":"5","key":"446_CR57","doi-asserted-by":"publisher","first-page":"997","DOI":"10.1016\/S0031-3203(01)00089-9","volume":"35","author":"AFR Rahman","year":"2002","unstructured":"Rahman, A.F.R., Rahman, R., Fairhurst, M.C.: Recognition of handwritten Bengali characters: a novel multistage approach. Pattern Recogn. 35(5), 997\u20131006 (2002)","journal-title":"Pattern Recogn."},{"key":"446_CR58","unstructured":"Mahmud, J.U., Raihan, M.F., Rahman, C.M.: A complete OCR system for continuous Bengali characters. In: TENCON 2003. Conference on Convergent Technologies for Asia-Pacific Region, vol. 4, pp. 1372\u20131376 (2003). IEEE"},{"key":"446_CR59","unstructured":"Kamruzzaman, J., Aziz, S.: Improved machine recognition for Bangla characters. In: International Conference on Electrical and Computer Engineering 2004, pp. 557\u2013560 (2004). ICECE 2004 Conference Secretariat, Bangladesh of Engineering and Technology"},{"issue":"01","key":"446_CR60","first-page":"30","volume":"1","author":"MM Alam","year":"2010","unstructured":"Alam, M.M., Kashem, M.A.: A complete Bangla OCR system for printed characters. JCIT 1(01), 30\u201335 (2010)","journal-title":"JCIT"},{"key":"446_CR61","unstructured":"Ahmed, S., Kashem, M.A.: Enhancing the character segmentation accuracy of Bangla OCR using BPNN. Int. J. Sci. Res. (IJSR) ISSN (Online), 2319\u20137064 (2013)"},{"key":"446_CR62","unstructured":"Chowdhury, A.A., Ahmed, E., Ahmed, S., Hossain, S., Rahman, C.M.: Optical character recognition of Bangla characters using neural network: a better approach. In: 2nd ICEE (2002)"},{"key":"446_CR63","unstructured":"Ahmed, S., Sakib, A.N., Ishtiaque\u00a0Mahmud, M., Belali, H., Rahman, S.: The anatomy of Bangla OCR system for printed texts using back propagation neural network. Glob. J. Comput. Sci. Technol. (2012)"},{"key":"446_CR64","doi-asserted-by":"crossref","unstructured":"Afroge, S., Ahmed, B., Hossain, A.: Bangla optical character recognition through segmentation using curvature distance and multilayer perceptron algorithm. In: 2017 International Conference on Electrical, Computer and Communication Engineering (ECCE), pp. 253\u2013257 (2017). IEEE","DOI":"10.1109\/ECACE.2017.7912914"},{"key":"446_CR65","doi-asserted-by":"crossref","unstructured":"Hossain, S.A., Tabassum, T.: Neural net based complete character recognition scheme for Bangla printed text books. In: 16th International Conference on Computer and Information Technology, pp. 71\u201375 (2014). IEEE","DOI":"10.1109\/ICCITechn.2014.6997336"},{"key":"446_CR66","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1016\/j.jvcir.2017.11.016","volume":"50","author":"R Pramanik","year":"2018","unstructured":"Pramanik, R., Bag, S.: Shape decomposition-based handwritten compound character recognition for Bangla OCR. J. Vis. Commun. Image Represent. 50, 123\u2013134 (2018)","journal-title":"J. Vis. Commun. Image Represent."},{"key":"446_CR67","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1016\/j.patcog.2019.03.030","volume":"92","author":"R Ghosh","year":"2019","unstructured":"Ghosh, R., Vamshi, C., Kumar, P.: RNN based online handwritten word recognition in Devanagari and Bengali scripts using horizontal zoning. Pattern Recogn. 92, 203\u2013218 (2019)","journal-title":"Pattern Recogn."},{"key":"446_CR68","doi-asserted-by":"crossref","unstructured":"Purkaystha, B., Datta, T., Islam, M.S.: Bengali handwritten character recognition using deep convolutional neural network. In: 2017 20th International Conference of Computer and Information Technology (ICCIT), pp. 1\u20135 (2017). IEEE","DOI":"10.1109\/ICCITECHN.2017.8281853"},{"key":"446_CR69","doi-asserted-by":"publisher","first-page":"10631","DOI":"10.1007\/s11042-022-12070-4","volume":"81","author":"MS Islam","year":"2022","unstructured":"Islam, M.S., Rahman, M.M., Rahman, M.H., Rivolta, M.W., Aktaruzzaman, M.: Ratnet: a deep learning model for Bengali handwritten characters recognition. Multimed. Tools Appl. 81, 10631\u201310651 (2022). https:\/\/doi.org\/10.1007\/s11042-022-12070-4","journal-title":"Multimed. Tools Appl."},{"key":"446_CR70","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1007\/978-981-15-6318-8_8","volume-title":"Machine Learning, Image Processing, Network Security and Data Sciences","author":"S Maity","year":"2020","unstructured":"Maity, S., Dey, A., Chowdhury, A., Banerjee, A.: Handwritten Bengali character recognition using deep convolution neural network. In: Bhattacharjee, A., Borgohain, S.K., Soni, B., Verma, G., Gao, X.-Z. (eds.) Machine Learning, Image Processing, Network Security and Data Sciences, pp. 84\u201392. Springer, Singapore (2020)"},{"key":"446_CR71","unstructured":"Roy, A.: AKHCRNet: Bengali Handwritten Character Recognition Using Deep Learning (2020)"},{"key":"446_CR72","doi-asserted-by":"crossref","unstructured":"Sharif, S., Mohammed, N., Momen, S., Mansoor, N.: Classification of Bangla compound characters using a HOG-CNN hybrid model. In: Proceedings of the International Conference on Computing and Communication Systems, pp. 403\u2013411 (2018). Springer","DOI":"10.1007\/978-981-10-6890-4_39"},{"key":"446_CR73","doi-asserted-by":"crossref","unstructured":"Hasan, M.J., Wahid, M.F., Alom, M.S.: Bangla compound character recognition by combining deep convolutional neural network with bidirectional long short-term memory. In: 2019 4th International Conference on Electrical Information and Communication Technology (EICT), pp. 1\u20134 (2019). IEEE","DOI":"10.1109\/EICT48899.2019.9068817"},{"key":"446_CR74","unstructured":"Paul, D., Chaudhuri, B.B.: A BLSTM network for printed Bengali OCR system with high accuracy. arXiv preprint arXiv:1908.08674 (2019)"},{"key":"446_CR75","unstructured":"Glorot, X., Bengio, Y.: Understanding the difficulty of training deep feedforward neural networks. In: Proceedings of the Thirteenth International Conference on Artificial Intelligence and Statistics, pp. 249\u2013256 (2010). JMLR Workshop and Conference Proceedings"},{"key":"446_CR76","doi-asserted-by":"publisher","unstructured":"Rahman, M.A., Tabassum, N., Paul, M., Pal, R., Islam, M.K.: BN-HTRd: A Benchmark Dataset for Document Level Offline Bangla Handwritten Text Recognition (HTR) and Line Segmentation. arXiv (2022). https:\/\/doi.org\/10.48550\/ARXIV.2206.08977. https:\/\/arxiv.org\/abs\/2206.08977","DOI":"10.48550\/ARXIV.2206.08977"},{"key":"446_CR77","doi-asserted-by":"publisher","DOI":"10.1016\/j.dib.2020.106633","volume":"34","author":"MF Mridha","year":"2021","unstructured":"Mridha, M.F., Ohi, A.Q., Ali, M.A., Emon, M.I., Kabir, M.M.: Banglawriting: a multi-purpose offline Bangla handwriting dataset. Data Brief. 34, 106633 (2021). https:\/\/doi.org\/10.1016\/j.dib.2020.106633","journal-title":"Data Brief."},{"key":"446_CR78","doi-asserted-by":"crossref","unstructured":"Banik, M., Rifat, M.J.R., Nahar, J., Hasan, N., Rahman, F.: Okkhor: a synthetic corpus of Bangla printed characters. In: Arai, K., Kapoor, S., Bhatia, R. (eds.) Proceedings of the Future Technologies Conference (FTC) 2020, vol. 1, pp. 693\u2013711. Springer, Cham (2021)","DOI":"10.1007\/978-3-030-63128-4_53"},{"key":"446_CR79","unstructured":"Roark, B., Wolf-Sonkin, L., Kirov, C., Mielke, S.J., Johny, C., Demirsahin, I., Hall, K.: Processing South Asian languages written in the Latin script: the Dakshina dataset. In: Proceedings of the 12th Language Resources and Evaluation Conference, pp. 2413\u20132423. European Language Resources Association, Marseille, France (2020). https:\/\/aclanthology.org\/2020.lrec-1.294"},{"issue":"1","key":"446_CR80","first-page":"78","volume":"21","author":"MA Al Mumin","year":"2014","unstructured":"Al Mumin, M.A., Shoeb, A.A.M., Selim, M.R., Iqbal, M.Z.: Sumono: a representative modern Bengali corpus. SUST J. Sci. Technol. 21(1), 78\u201386 (2014)","journal-title":"SUST J. Sci. Technol."},{"key":"446_CR81","doi-asserted-by":"publisher","unstructured":"Biswas, E.: Bangla Largest Newspaper Dataset. Kaggle (2021). https:\/\/doi.org\/10.34740\/KAGGLE\/DSV\/1857507. https:\/\/www.kaggle.com\/dsv\/1857507","DOI":"10.34740\/KAGGLE\/DSV\/1857507"},{"key":"446_CR82","doi-asserted-by":"publisher","unstructured":"Ahmed, M.F., Mahmud, Z., Biash, Z.T., Ryen, A.A.N., Hossain, A., Ashraf, F.B.: Bangla Online Comments Dataset. Mendeley Data (2021). https:\/\/doi.org\/10.17632\/9xjx8twk8p.1. https:\/\/data.mendeley.com\/datasets\/9xjx8twk8p\/1","DOI":"10.17632\/9xjx8twk8p.1"},{"key":"446_CR83","unstructured":"Farahmand, A., Sarrafzadeh, H., Shanbehzadeh, J.: Document image noises and removal methods (2013)"},{"key":"446_CR84","doi-asserted-by":"publisher","unstructured":"Lee, C.-Y., Osindero, S.: Recursive recurrent nets with attention modeling for OCR in the wild. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 2231\u20132239 (2016). https:\/\/doi.org\/10.1109\/CVPR.2016.245","DOI":"10.1109\/CVPR.2016.245"},{"issue":"1","key":"446_CR85","doi-asserted-by":"publisher","first-page":"168","DOI":"10.1145\/321796.321811","volume":"21","author":"RA Wagner","year":"1974","unstructured":"Wagner, R.A., Fischer, M.J.: The string-to-string correction problem. J. ACM (JACM) 21(1), 168\u2013173 (1974)","journal-title":"J. ACM (JACM)"},{"key":"446_CR86","doi-asserted-by":"publisher","DOI":"10.3390\/info11020125","author":"A Buslaev","year":"2020","unstructured":"Buslaev, A., Iglovikov, V.I., Khvedchenya, E., Parinov, A., Druzhinin, M., Kalinin, A.A.: Albumentations: fast and flexible image augmentations. Information (2020). https:\/\/doi.org\/10.3390\/info11020125","journal-title":"Information"},{"key":"446_CR87","doi-asserted-by":"publisher","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Delving deep into rectifiers: surpassing human-level performance on imagenet classification. In: 2015 IEEE International Conference on Computer Vision (ICCV), pp. 1026\u20131034. IEEE Computer Society, Los Alamitos, CA, USA (2015). https:\/\/doi.org\/10.1109\/ICCV.2015.123","DOI":"10.1109\/ICCV.2015.123"},{"key":"446_CR88","unstructured":"Loshchilov, I., Hutter, F.: SGDR: Stochastic Gradient Descent with Warm Restarts (2017)"},{"key":"446_CR89","unstructured":"Paszke, A., Gross, S., Massa, F., Lerer, A., Bradbury, J., Chanan, G., Killeen, T., Lin, Z., Gimelshein, N., Antiga, L., Desmaison, A., Kopf, A., Yang, E., DeVito, Z., Raison, M., Tejani, A., Chilamkurthy, S., Steiner, B., Fang, L., Bai, J., Chintala, S.: Pytorch: an imperative style, high-performance deep learning library. In: Advances in Neural Information Processing Systems 32, pp. 8024\u20138035. Curran Associates, Inc. (2019). http:\/\/papers.neurips.cc\/paper\/9015-pytorch-an-imperative-style-high-performance-deep-learning-library.pdf"}],"container-title":["International Journal on Document Analysis and Recognition (IJDAR)"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10032-023-00446-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10032-023-00446-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10032-023-00446-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,25]],"date-time":"2024-10-25T19:22:18Z","timestamp":1729884138000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10032-023-00446-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,8,5]]},"references-count":89,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2024,3]]}},"alternative-id":["446"],"URL":"https:\/\/doi.org\/10.1007\/s10032-023-00446-7","relation":{},"ISSN":["1433-2833","1433-2825"],"issn-type":[{"type":"print","value":"1433-2833"},{"type":"electronic","value":"1433-2825"}],"subject":[],"published":{"date-parts":[[2023,8,5]]},"assertion":[{"value":"4 August 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 March 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 June 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 August 2023","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}