{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T07:27:33Z","timestamp":1740122853778,"version":"3.37.3"},"reference-count":62,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2022,2,28]],"date-time":"2022-02-28T00:00:00Z","timestamp":1646006400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,2,28]],"date-time":"2022-02-28T00:00:00Z","timestamp":1646006400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001409","name":"Department of Science and Technology, Ministry of Science and Technology","doi-asserted-by":"publisher","award":["EMR\/2016\/007213","EMR\/2016\/007213","EMR\/2016\/007213"],"award-info":[{"award-number":["EMR\/2016\/007213","EMR\/2016\/007213","EMR\/2016\/007213"]}],"id":[{"id":"10.13039\/501100001409","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001407","name":"Department of Biotechnology , Ministry of Science and Technology","doi-asserted-by":"publisher","award":["BT\/PR16356\/BID\/7\/596\/2016"],"award-info":[{"award-number":["BT\/PR16356\/BID\/7\/596\/2016"]}],"id":[{"id":"10.13039\/501100001407","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2022,5]]},"DOI":"10.1007\/s11042-022-12596-7","type":"journal-article","created":{"date-parts":[[2022,2,28]],"date-time":"2022-02-28T16:03:15Z","timestamp":1646064195000},"page":"15367-15394","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["How to handle bi\/tri-lingual Indic texts in a single image? A new dataset of natural scene and born-digital images"],"prefix":"10.1007","volume":"81","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2723-1434","authenticated-orcid":false,"given":"Neelotpal","family":"Chakraborty","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Arkoprobho","family":"Mitra","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ayush","family":"Choudhury","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ayatullah Faruk","family":"Mollah","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Subhadip","family":"Basu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ram","family":"Sarkar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,2,28]]},"reference":[{"unstructured":"Abadi, M., Barham, P., Chen, J., Chen, Z., Davis, A., Dean, J., ... & Zheng, X. (2016). Tensorflow: A system for large-scale machine learning. In 12th {USENIX} symposium on operating systems design and implementation ({OSDI} 16) (pp. 265\u2013283).","key":"12596_CR1"},{"doi-asserted-by":"crossref","unstructured":"Agrawal A, Mukherjee P, Srivastava S, & Lall B (2018). Enhanced characterness for text detection in the wild. In proceedings of 2nd international conference on Computer Vision & Image Processing (pp. 359\u2013369). Springer, Singapore","key":"12596_CR2","DOI":"10.1007\/978-981-10-7895-8_28"},{"doi-asserted-by":"crossref","unstructured":"Baur C, Albarqouni S, Navab N (2017) Semi-supervised deep learning for fully convolutional networks. In international conference on medical image computing and computer-assisted intervention (pp. 311-319). Springer, Cham.","key":"12596_CR3","DOI":"10.1007\/978-3-319-66179-7_36"},{"key":"12596_CR4","doi-asserted-by":"publisher","first-page":"172","DOI":"10.1016\/j.patcog.2018.07.034","volume":"85","author":"AK Bhunia","year":"2019","unstructured":"Bhunia AK, Konwer A, Bhunia AK, Bhowmick A, Roy PP, Pal U (2019) Script identification in natural scene image and video frames using an attention based convolutional-LSTM network. Pattern Recogn 85:172\u2013184","journal-title":"Pattern Recogn"},{"doi-asserted-by":"crossref","unstructured":"Bu\u0161ta M, Patel Y, Matas J (2018, December) E2e-mlt-an unconstrained end-to-end method for multi-language scene text. In Asian conference on computer vision (pp. 127-143). Springer, Cham.","key":"12596_CR5","DOI":"10.1007\/978-3-030-21074-8_11"},{"key":"12596_CR6","doi-asserted-by":"publisher","first-page":"7997","DOI":"10.1007\/s12652-020-02528-4","volume":"12","author":"N Chakraborty","year":"2020","unstructured":"Chakraborty N, Kundu S, Paul S, Mollah AF, Basu S, Sarkar R (2020) Language identification from multi-lingual scene text images: a CNN based classifier ensemble approach. J Ambient Intell Humaniz Comput 12:7997\u20138008","journal-title":"J Ambient Intell Humaniz Comput"},{"issue":"1","key":"12596_CR7","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1007\/s11042-020-09728-2","volume":"80","author":"N Chakraborty","year":"2021","unstructured":"Chakraborty N, Chatterjee A, Singh PK, Mollah AF, Sarkar R (2021) Application of daisy descriptor for language identification in the wild. Multimed Tools Appl 80(1):323\u2013344","journal-title":"Multimed Tools Appl"},{"doi-asserted-by":"crossref","unstructured":"Chen H, Tsai SS, Schroth G, Chen DM, Grzeszczuk R, Girod B (2011) Robust text detection in natural images with edge-enhanced maximally stable extremal regions. In 2011 18th IEEE international conference on image processing (pp. 2609-2612). IEEE.","key":"12596_CR8","DOI":"10.1109\/ICIP.2011.6116200"},{"doi-asserted-by":"crossref","unstructured":"Cheng C, Huang Q, Bai X, Feng B, Liu W (2019, September) Patch aggregator for scene text script identification. In 2019 international conference on document analysis and recognition (ICDAR) (pp. 1077-1083). IEEE.","key":"12596_CR9","DOI":"10.1109\/ICDAR.2019.00175"},{"issue":"1","key":"12596_CR10","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12864-019-6413-7","volume":"21","author":"D Chicco","year":"2020","unstructured":"Chicco D, Jurman G (2020) The advantages of the Matthews correlation coefficient (MCC) over F1 score and accuracy in binary classification evaluation. BMC Genomics 21(1):1\u201313","journal-title":"BMC Genomics"},{"doi-asserted-by":"crossref","unstructured":"Chollet F (2017) Xception: deep learning with depthwise separable convolutions. In proceedings of the IEEE conference on computer vision and pattern recognition (pp. 1251-1258).","key":"12596_CR11","DOI":"10.1109\/CVPR.2017.195"},{"doi-asserted-by":"crossref","unstructured":"Deng D, Liu H, Li X, Cai D (2018) Pixellink: detecting scene text via instance segmentation. In proceedings of the AAAI conference on artificial intelligence (Vol. 32, no. 1).","key":"12596_CR12","DOI":"10.1609\/aaai.v32i1.12269"},{"issue":"3","key":"12596_CR13","doi-asserted-by":"publisher","first-page":"31","DOI":"10.4018\/IJCVIP.2020070103","volume":"10","author":"D Dhar","year":"2020","unstructured":"Dhar D, Chakraborty N, Choudhury S, Paul A, Mollah AF, Basu S, Sarkar R (2020) Multilingual scene text detection using gradient morphology. Int J Comput Vision Image Process (IJCVIP) 10(3):31\u201343","journal-title":"Int J Comput Vision Image Process (IJCVIP)"},{"doi-asserted-by":"crossref","unstructured":"Doulamis N, Doulamis A (2014) Semi-supervised deep learning for object tracking and classification. In 2014 IEEE international conference on image processing (ICIP) (pp. 848-852). IEEE.","key":"12596_CR14","DOI":"10.1109\/ICIP.2014.7025170"},{"issue":"5","key":"12596_CR15","doi-asserted-by":"publisher","first-page":"7609","DOI":"10.1007\/s11042-020-09785-7","volume":"80","author":"IN Dutta","year":"2021","unstructured":"Dutta IN, Chakraborty N, Mollah AF, Basu S, Sarkar R (2021) BOB: a bi-level overlapped binning procedure for scene word binarization. Multimed Tools Appl 80(5):7609\u20137635","journal-title":"Multimed Tools Appl"},{"doi-asserted-by":"crossref","unstructured":"Epshtein B, Ofek E, Wexler Y (2010) Detecting text in natural scenes with stroke width transform. In 2010 IEEE computer society conference on computer vision and pattern recognition (pp. 2963-2970). IEEE.","key":"12596_CR16","DOI":"10.1109\/CVPR.2010.5540041"},{"key":"12596_CR17","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1016\/j.neucom.2018.03.041","volume":"304","author":"K Fan","year":"2018","unstructured":"Fan K, Baek SJ (2018) A robust proposal generation method for text lines in natural scene images. Neurocomputing 304:47\u201363","journal-title":"Neurocomputing"},{"doi-asserted-by":"crossref","unstructured":"Fujii Y, Driesen K, Baccash J, Hurst A, Popat AC (2017, November) Sequence-to-label script identification for multilingual ocr. In 2017 14th IAPR international conference on document analysis and recognition (ICDAR) (Vol. 1, pp. 161-168). IEEE.","key":"12596_CR18","DOI":"10.1109\/ICDAR.2017.35"},{"doi-asserted-by":"crossref","unstructured":"Gomez L, Karatzas D (2016) A fine-grained approach to scene text script identification. In 2016 12th IAPR workshop on document analysis systems (DAS) (pp. 192-197). IEEE.","key":"12596_CR19","DOI":"10.1109\/DAS.2016.64"},{"key":"12596_CR20","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1016\/j.patcog.2017.01.032","volume":"67","author":"L Gomez","year":"2017","unstructured":"Gomez L, Nicolaou A, Karatzas D (2017) Improving patch-based scene text script identification with ensembles of conjoined networks. Pattern Recogn 67:85\u201396","journal-title":"Pattern Recogn"},{"key":"12596_CR21","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1016\/j.neucom.2015.09.116","volume":"187","author":"Y Guo","year":"2016","unstructured":"Guo Y, Liu Y, Oerlemans A, Lao S, Wu S, Lew MS (2016) Deep learning for visual understanding: a review. Neurocomputing 187:27\u201348","journal-title":"Neurocomputing"},{"doi-asserted-by":"crossref","unstructured":"Haifeng D, Siqi H (2020, September) Natural scene text detection based on YOLO V2 network model. In journal of physics: conference series (Vol. 1634, no. 1, p. 012013). IOP publishing.","key":"12596_CR22","DOI":"10.1088\/1742-6596\/1634\/1\/012013"},{"doi-asserted-by":"crossref","unstructured":"Huang G, Liu Z, Van Der Maaten L, Weinberger KQ (2017) Densely connected convolutional networks. In proceedings of the IEEE conference on computer vision and pattern recognition (pp. 4700-4708).","key":"12596_CR23","DOI":"10.1109\/CVPR.2017.243"},{"doi-asserted-by":"crossref","unstructured":"Huang G, Liu S, Van der Maaten L, Weinberger KQ (2018) Condensenet: an efficient densenet using learned group convolutions. In proceedings of the IEEE conference on computer vision and pattern recognition (pp. 2752-2761).","key":"12596_CR24","DOI":"10.1109\/CVPR.2018.00291"},{"doi-asserted-by":"crossref","unstructured":"Jiang Y, Zhu X, Wang X, Yang S, Li W, Wang H, ... & Luo Z (2017). R2cnn: rotational region cnn for orientation robust scene text detection. arXiv preprint arXiv:1706.09579.","key":"12596_CR25","DOI":"10.1109\/ICPR.2018.8545598"},{"issue":"1","key":"12596_CR26","doi-asserted-by":"publisher","first-page":"77","DOI":"10.1007\/s40010-017-0478-y","volume":"89","author":"SF Joan","year":"2019","unstructured":"Joan SF, Valli S (2019) A survey on text information extraction from born-digital and scene text images. Proceed National Acad Sci, India Section A: Phys Sci 89(1):77\u2013101","journal-title":"Proceed National Acad Sci, India Section A: Phys Sci"},{"issue":"1","key":"12596_CR27","doi-asserted-by":"publisher","first-page":"78","DOI":"10.4218\/etrij.11.1510.0029","volume":"33","author":"J Jung","year":"2011","unstructured":"Jung J, Lee S, Cho MS, Kim JH (2011) Touch TT: scene text extractor using touchscreen interface. ETRI J 33(1):78\u201388","journal-title":"ETRI J"},{"doi-asserted-by":"crossref","unstructured":"Karatzas D, Mestre SR, Mas J, Nourbakhsh F, Roy PP (2011) ICDAR 2011 robust reading competition-challenge 1: reading text in born-digital images (web and email). In 2011 international conference on document analysis and recognition (pp. 1485-1490). IEEE.","key":"12596_CR28","DOI":"10.1109\/ICDAR.2011.295"},{"doi-asserted-by":"crossref","unstructured":"Karatzas D, Shafait F, Uchida S, Iwamura M, i Bigorda LG, Mestre, S. R., ... & De Las Heras LP (2013). ICDAR 2013 robust reading competition. In 2013 12th International Conference on Document Analysis and Recognition (pp. 1484\u20131493). IEEE.","key":"12596_CR29","DOI":"10.1109\/ICDAR.2013.221"},{"doi-asserted-by":"crossref","unstructured":"Karatzas, D., Gomez-Bigorda, L., Nicolaou, A., Ghosh, S., Bagdanov, A., Iwamura, M., ... & Valveny E (2015). ICDAR 2015 competition on robust reading. In 2015 13th International Conference on Document Analysis and Recognition (ICDAR) (pp. 1156\u20131160). IEEE.","key":"12596_CR30","DOI":"10.1109\/ICDAR.2015.7333942"},{"issue":"22","key":"12596_CR31","doi-asserted-by":"publisher","first-page":"32159","DOI":"10.1007\/s11042-019-08028-8","volume":"78","author":"T Khan","year":"2019","unstructured":"Khan T, Mollah AF (2019) AUTNT-A component level dataset for text non-text classification and benchmarking with novel script invariant feature descriptors and D-CNN. Multimed Tools Appl 78(22):32159\u201332186","journal-title":"Multimed Tools Appl"},{"key":"12596_CR32","doi-asserted-by":"publisher","first-page":"3239","DOI":"10.1007\/s10462-020-09930-6","volume":"54","author":"T Khan","year":"2021","unstructured":"Khan T, Sarkar R, Mollah AF (2021) Deep learning approaches to scene text detection: a comprehensive review. Artif Intell Rev 54:3239\u20133298","journal-title":"Artif Intell Rev"},{"unstructured":"Kingma DP, Ba J (2014) Adam: a method for stochastic optimization. arXiv preprint arXiv:1412.6980.","key":"12596_CR33"},{"doi-asserted-by":"crossref","unstructured":"Liao M, Shi B, Bai X, Wang X, Liu W (2017) February. A fast text detector with a single deep neural network. In Thirty-first AAAI conference on artificial intelligence, Textboxes","key":"12596_CR34","DOI":"10.1609\/aaai.v31i1.11196"},{"issue":"8","key":"12596_CR35","doi-asserted-by":"publisher","first-page":"3676","DOI":"10.1109\/TIP.2018.2825107","volume":"27","author":"M Liao","year":"2018","unstructured":"Liao M, Shi B, Bai X (2018) Textboxes++: a single-shot oriented scene text detector. IEEE Trans Image Process 27(8):3676\u20133690","journal-title":"IEEE Trans Image Process"},{"issue":"1","key":"12596_CR36","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1007\/s005300050006","volume":"8","author":"R Lienhart","year":"2000","unstructured":"Lienhart R, Effelsberg W (2000) Automatic text segmentation and text recognition for video indexing. Multimedia Systems 8(1):69\u201381","journal-title":"Multimedia Systems"},{"doi-asserted-by":"crossref","unstructured":"Liu W, Anguelov D, Erhan D, Szegedy C, Reed S, Fu CY, Berg AC (2016) Ssd: single shot multibox detector. In European conference on computer vision (pp. 21-37). Springer, Cham.","key":"12596_CR37","DOI":"10.1007\/978-3-319-46448-0_2"},{"doi-asserted-by":"crossref","unstructured":"Liu Z, Lin G, Yang S, Liu F, Lin W, Goh WL (2019) Towards robust curve text detection with conditional spatial expansion. In proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 7269-7278).","key":"12596_CR38","DOI":"10.1109\/CVPR.2019.00744"},{"issue":"13","key":"12596_CR39","doi-asserted-by":"publisher","first-page":"18205","DOI":"10.1007\/s11042-019-7177-4","volume":"78","author":"Z Liu","year":"2019","unstructured":"Liu Z, Zhou W, Li H (2019) Scene text detection with fully convolutional neural networks. Multimed Tools Appl 78(13):18205\u201318227","journal-title":"Multimed Tools Appl"},{"key":"12596_CR40","doi-asserted-by":"publisher","first-page":"52669","DOI":"10.1109\/ACCESS.2019.2911964","volume":"7","author":"L Lu","year":"2019","unstructured":"Lu L, Yi Y, Huang F, Wang K, Wang Q (2019) Integrating local CNN and global CNN for script identification in natural scene images. IEEE Access 7:52669\u201352679","journal-title":"IEEE Access"},{"doi-asserted-by":"crossref","unstructured":"Lucas SM (2005) ICDAR 2005 text locating competition results. In eighth international conference on document analysis and recognition (ICDAR'05) (pp. 80-84). IEEE.","key":"12596_CR41","DOI":"10.1109\/ICDAR.2005.231"},{"issue":"2\u20133","key":"12596_CR42","doi-asserted-by":"publisher","first-page":"105","DOI":"10.1007\/s10032-004-0134-3","volume":"7","author":"SM Lucas","year":"2005","unstructured":"Lucas SM, Panaretos A, Sosa L, Tang A, Wong S, Young R, \u2026 Lin X (2005) ICDAR 2003 robust reading competitions: entries, results, and future directions. IJDAR 7(2\u20133):105\u2013122","journal-title":"IJDAR"},{"issue":"10","key":"12596_CR43","doi-asserted-by":"publisher","first-page":"761","DOI":"10.1016\/j.imavis.2004.02.006","volume":"22","author":"J Matas","year":"2004","unstructured":"Matas J, Chum O, Urban M, Pajdla T (2004) Robust wide-baseline stereo from maximally stable extremal regions. Image Vis Comput 22(10):761\u2013767","journal-title":"Image Vis Comput"},{"doi-asserted-by":"crossref","unstructured":"Mei J, Dai L, Shi B, Bai X (2016) Scene text script identification with convolutional recurrent neural networks. In 2016 23rd international conference on pattern recognition (ICPR) (pp. 4053-4058). IEEE.","key":"12596_CR44","DOI":"10.1109\/ICPR.2016.7900268"},{"issue":"2","key":"12596_CR45","doi-asserted-by":"publisher","first-page":"48","DOI":"10.4018\/IJCVIP.2019040104","volume":"9","author":"A Mukhopadhyay","year":"2019","unstructured":"Mukhopadhyay A, Kumar S, Chowdhury SR, Chakraborty N, Mollah AF, Basu S, Sarkar R (2019) Multi-lingual scene text detection using one-class classifier. Int J Comput Vision Image Process (IJCVIP) 9(2):48\u201365","journal-title":"Int J Comput Vision Image Process (IJCVIP)"},{"doi-asserted-by":"crossref","unstructured":"Nayef, N., Yin, F., Bizid, I., Choi, H., Feng, Y., Karatzas, D., ... & Ogier JM (2017). Icdar2017 robust reading challenge on multi-lingual scene text detection and script identification-rrc-mlt. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR) (Vol. 1, pp. 1454\u20131459). IEEE.","key":"12596_CR46","DOI":"10.1109\/ICDAR.2017.237"},{"doi-asserted-by":"crossref","unstructured":"Nayef, N., Patel, Y., Busta, M., Chowdhury, P. N., Karatzas, D., Khlif, W., ... & Ogier, J. M. (2019). ICDAR2019 robust reading challenge on multi-lingual scene text detection and recognition\u2014RRC-MLT-2019. In 2019 International Conference on Document Analysis and Recognition (ICDAR) (pp. 1582\u20131587). IEEE.","key":"12596_CR47","DOI":"10.1109\/ICDAR.2019.00254"},{"doi-asserted-by":"crossref","unstructured":"\u00d6zgen AC, Fasounaki M, Ekenel HK (2018) Text detection in natural and computer-generated images. In 2018 26th signal processing and communications applications conference (SIU) (pp. 1-4). IEEE.","key":"12596_CR48","DOI":"10.1109\/SIU.2018.8404600"},{"issue":"13","key":"12596_CR49","doi-asserted-by":"publisher","first-page":"18017","DOI":"10.1007\/s11042-019-7178-3","volume":"78","author":"S Paul","year":"2019","unstructured":"Paul S, Saha S, Basu S, Saha PK, Nasipuri M (2019) Text localization in camera captured images using fuzzy distance transform based adaptive stroke filter. Multimed Tools Appl 78(13):18017\u201318036","journal-title":"Multimed Tools Appl"},{"issue":"4","key":"12596_CR50","doi-asserted-by":"publisher","first-page":"1145","DOI":"10.1109\/TCSVT.2018.2817642","volume":"29","author":"KS Raghunandan","year":"2018","unstructured":"Raghunandan KS, Shivakumara P, Roy S, Kumar GH, Pal U, Lu T (2018) Multi-script-oriented text detection and recognition in video\/scene\/born digital images. IEEE Trans Circ Syst Video Technol 29(4):1145\u20131162","journal-title":"IEEE Trans Circ Syst Video Technol"},{"doi-asserted-by":"crossref","unstructured":"Redmon J, Divvala S, Girshick R, Farhadi A (2016) You only look once: unified, real-time object detection. In proceedings of the IEEE conference on computer vision and pattern recognition (pp. 779-788).","key":"12596_CR51","DOI":"10.1109\/CVPR.2016.91"},{"key":"12596_CR52","doi-asserted-by":"publisher","first-page":"16","DOI":"10.1016\/j.patrec.2020.06.024","volume":"138","author":"S Saha","year":"2020","unstructured":"Saha S, Chakraborty N, Kundu S, Paul S, Mollah AF, Basu S, Sarkar R (2020) Multi-lingual scene text detection and language identification. Pattern Recogn Lett 138:16\u201322","journal-title":"Pattern Recogn Lett"},{"unstructured":"Tarvainen A, Valpola H (2017) Mean teachers are better role models: weight-averaged consistency targets improve semi-supervised deep learning results. arXiv preprint arXiv:1703.01780.","key":"12596_CR53"},{"doi-asserted-by":"crossref","unstructured":"Tian Z, Huang W, He T, He P, Qiao Y (2016) Detecting text in natural image with connectionist text proposal network. In European conference on computer vision (pp. 56-72). Springer, Cham.","key":"12596_CR54","DOI":"10.1007\/978-3-319-46484-8_4"},{"unstructured":"Veit, A., Matera, T., Neumann, L., Matas, J., & Belongie, S. (2016). Coco-text: dataset and benchmark for text detection and recognition in natural images. arXiv preprint arXiv:1601.07140.","key":"12596_CR55"},{"key":"12596_CR56","first-page":"1","volume":"2018","author":"A Voulodimos","year":"2018","unstructured":"Voulodimos A, Doulamis N, Doulamis A, Protopapadakis E (2018) Deep learning for computer vision: a brief review. Comput Intell Neurosci 2018:1\u201313","journal-title":"Comput Intell Neurosci"},{"issue":"2s","key":"12596_CR57","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3341095","volume":"16","author":"SH Wang","year":"2020","unstructured":"Wang SH, Zhang YD (2020) DenseNet-201-based deep neural network with composite learning factor and precomputation for multiple sclerosis classification. ACM Trans Multimedia Comput, Comm, Appl (TOMM) 16(2s):1\u201319","journal-title":"ACM Trans Multimedia Comput, Comm, Appl (TOMM)"},{"unstructured":"Yao C, Bai X, Liu W, Ma Y, Tu Z (2012) Detecting texts of arbitrary orientations in natural images. In 2012 IEEE conference on computer vision and pattern recognition (pp. 1083-1090). IEEE.","key":"12596_CR58"},{"key":"12596_CR59","doi-asserted-by":"publisher","first-page":"310","DOI":"10.1016\/j.neucom.2013.05.037","volume":"122","author":"H Zhang","year":"2013","unstructured":"Zhang H, Zhao K, Song YZ, Guo J (2013) Text extraction from natural scene image: a survey. Neurocomputing 122:310\u2013323","journal-title":"Neurocomputing"},{"doi-asserted-by":"crossref","unstructured":"Zhang Z, Zhang C, Shen W, Yao C, Liu W, Bai X (2016) Multi-oriented text detection with fully convolutional networks. In proceedings of the IEEE conference on computer vision and pattern recognition (pp. 4159-4167).","key":"12596_CR60","DOI":"10.1109\/CVPR.2016.451"},{"issue":"6","key":"12596_CR61","doi-asserted-by":"publisher","first-page":"1407","DOI":"10.1109\/TMI.2018.2823338","volume":"37","author":"Z Zhang","year":"2018","unstructured":"Zhang Z, Liang X, Dong X, Xie Y, Cao G (2018) A sparse-view CT reconstruction method based on combination of DenseNet and deconvolution. IEEE Trans Med Imaging 37(6):1407\u20131417","journal-title":"IEEE Trans Med Imaging"},{"doi-asserted-by":"crossref","unstructured":"Zhou X, Yao C, Wen H, Wang Y, Zhou S, He W, Liang J (2017) East: an efficient and accurate scene text detector. In proceedings of the IEEE conference on computer vision and pattern recognition (pp. 5551-5560).","key":"12596_CR62","DOI":"10.1109\/CVPR.2017.283"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-12596-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-022-12596-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-12596-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,19]],"date-time":"2024-09-19T13:27:50Z","timestamp":1726752470000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-022-12596-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,2,28]]},"references-count":62,"journal-issue":{"issue":"11","published-print":{"date-parts":[[2022,5]]}},"alternative-id":["12596"],"URL":"https:\/\/doi.org\/10.1007\/s11042-022-12596-7","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"type":"print","value":"1380-7501"},{"type":"electronic","value":"1573-7721"}],"subject":[],"published":{"date-parts":[[2022,2,28]]},"assertion":[{"value":"21 April 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 January 2022","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 February 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 February 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors state that there is no conflicts of interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}