{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,12]],"date-time":"2026-05-12T15:45:13Z","timestamp":1778600713242,"version":"3.51.4"},"reference-count":35,"publisher":"Springer Science and Business Media LLC","issue":"9","license":[{"start":{"date-parts":[[2023,11,25]],"date-time":"2023-11-25T00:00:00Z","timestamp":1700870400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,11,25]],"date-time":"2023-11-25T00:00:00Z","timestamp":1700870400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2024,9]]},"DOI":"10.1007\/s00371-023-03156-7","type":"journal-article","created":{"date-parts":[[2023,11,25]],"date-time":"2023-11-25T13:02:14Z","timestamp":1700917334000},"page":"6111-6122","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Answer sheet layout analysis based on YOLOv5s-DC and MSER"],"prefix":"10.1007","volume":"40","author":[{"given":"PengBin","family":"Fu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xu","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7984-3953","authenticated-orcid":false,"given":"HuiRong","family":"Yang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,11,25]]},"reference":[{"key":"3156_CR1","unstructured":"Higgins, E., Tatham, L.: Exploring the potential of multiple-choice questions in assessments. Learn. Teach. Action 2 (2003)"},{"key":"3156_CR2","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3012542","author":"J Memon","year":"2020","unstructured":"Memon, J., Sami, M., Khan, R.A., Uddin, M.: Handwritten optical character recognition (ocr): a comprehensive systematic literature review (slr). IEEE Access (2020). https:\/\/doi.org\/10.1109\/ACCESS.2020.3012542","journal-title":"IEEE Access"},{"key":"3156_CR3","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2018.2844689","author":"J Zhang","year":"2019","unstructured":"Zhang, J., Du, J., Dai, L.: Track, attend, and parse (tap): an end-to-end framework for online handwritten mathematical expression recognition. IEEE Trans. Multimed. (2019). https:\/\/doi.org\/10.1109\/TMM.2018.2844689","journal-title":"IEEE Trans. Multimed."},{"key":"3156_CR4","doi-asserted-by":"publisher","unstructured":"Truong, T.N., Nguyen, C.T., Phan, K.M., Nakagawa, M.: Improvement of end-to-end offline handwritten mathematical expression recognition by weakly supervised learning, vol. 2020 (2020). https:\/\/doi.org\/10.1109\/ICFHR2020.2020.00042","DOI":"10.1109\/ICFHR2020.2020.00042"},{"key":"3156_CR5","doi-asserted-by":"publisher","DOI":"10.1109\/MCI.2018.2840738","author":"T Young","year":"2018","unstructured":"Young, T., Hazarika, D., Poria, S., Cambria, E.: Recent trends in deep learning based natural language processing [review article]. IEEE Comput. Intell. Mag. (2018). https:\/\/doi.org\/10.1109\/MCI.2018.2840738","journal-title":"IEEE Comput. Intell. Mag."},{"key":"3156_CR6","doi-asserted-by":"publisher","unstructured":"Yepes, A.J., Zhong, P., Burdick, D.: ICDAR 2021 competition on scientific literature parsing, vol. 12824 LNCS (2021). https:\/\/doi.org\/10.1007\/978-3-030-86337-1_40","DOI":"10.1007\/978-3-030-86337-1_40"},{"key":"3156_CR7","doi-asserted-by":"publisher","DOI":"10.1007\/s00371-020-01927-0","author":"RP Kaur","year":"2021","unstructured":"Kaur, R.P., Jindal, M.K., Kumar, M.: Text and graphics segmentation of newspapers printed in gurmukhi script: a hybrid approach. Vis. Comput. (2021). https:\/\/doi.org\/10.1007\/s00371-020-01927-0","journal-title":"Vis. Comput."},{"key":"3156_CR8","doi-asserted-by":"publisher","unstructured":"Palm, R.B., Winther, O., Laws, F.: Cloudscan\u2014A Configuration-Free Invoice Analysis System Using Recurrent Neural Networks, vol. 1 (2017). https:\/\/doi.org\/10.1109\/ICDAR.2017.74","DOI":"10.1109\/ICDAR.2017.74"},{"key":"3156_CR9","first-page":"21002","volume":"33","author":"X Li","year":"2020","unstructured":"Li, X., Wang, W., Wu, L., Chen, S., Hu, X., Li, J., Tang, J., Yang, J.: Generalized focal loss: learning qualified and distributed bounding boxes for dense object detection. Adv. Neural. Inf. Process. Syst. 33, 21002\u201321012 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"3156_CR10","doi-asserted-by":"publisher","first-page":"146","DOI":"10.1016\/j.neucom.2022.07.042","volume":"506","author":"Y-F Zhang","year":"2022","unstructured":"Zhang, Y.-F., Ren, W., Zhang, Z., Jia, Z., Wang, L., Tan, T.: Focal and efficient iou loss for accurate bounding box regression. Neurocomputing 506, 146\u2013157 (2022)","journal-title":"Neurocomputing"},{"key":"3156_CR11","doi-asserted-by":"publisher","unstructured":"Ha, J., Haralick, R.M., Phillips, I.T.: Recursive x-y cut using bounding boxes of connected components. In Proceedings of the International Conference on Document Analysis and Recognition, ICDAR, vol. 2 (1995). https:\/\/doi.org\/10.1109\/ICDAR.1995.602059","DOI":"10.1109\/ICDAR.1995.602059"},{"key":"3156_CR12","unstructured":"Pavlidis, T.: Page segmentation by white streams. In: Proceedings of the 1st ICDAR, pp. 945\u2013953 (1991)"},{"issue":"11","key":"3156_CR13","doi-asserted-by":"publisher","first-page":"1162","DOI":"10.1109\/34.244677","volume":"15","author":"L O\u2019Gorman","year":"1993","unstructured":"O\u2019Gorman, L.: The document spectrum for page layout analysis. IEEE Trans. Pattern Anal. Mach. Intell. 15(11), 1162\u20131173 (1993)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"4","key":"3156_CR14","doi-asserted-by":"publisher","first-page":"375","DOI":"10.1016\/0146-664X(82)90059-4","volume":"20","author":"FM Wahl","year":"1982","unstructured":"Wahl, F.M., Wong, K.Y., Casey, R.G.: Block segmentation and text extraction in mixed text\/image documents. Comput. Graphics Image Process. 20(4), 375\u2013390 (1982)","journal-title":"Comput. Graphics Image Process."},{"key":"3156_CR15","doi-asserted-by":"publisher","unstructured":"Kasar, T., Barlas, P., Adam, S., Chatelain, C., Paquet, T.: Learning to detect tables in scanned document images using line information. In 2013 12th International Conference on Document Analysis and Recognition, pp. 1185\u20131189 (2013). https:\/\/doi.org\/10.1109\/ICDAR.2013.240","DOI":"10.1109\/ICDAR.2013.240"},{"key":"3156_CR16","doi-asserted-by":"publisher","unstructured":"Chen, K., Seuret, M., Hennebert, J., Ingold, R.: Convolutional Neural Networks for Page Segmentation of Historical Document Images, vol. 01, pp. 965\u2013970 (2017). https:\/\/doi.org\/10.1109\/ICDAR.2017.161","DOI":"10.1109\/ICDAR.2017.161"},{"key":"3156_CR17","doi-asserted-by":"publisher","unstructured":"Shelhamer, E., Long, J., Darrell, T.: Fully Convolutional Networks for Semantic Segmentation, vol. 39, pp. 640\u2013651 (2017). https:\/\/doi.org\/10.1109\/TPAMI.2016.2572683","DOI":"10.1109\/TPAMI.2016.2572683"},{"key":"3156_CR18","doi-asserted-by":"publisher","first-page":"640","DOI":"10.1109\/TPAMI.2016.2572683","volume":"39","author":"E Shelhamer","year":"2017","unstructured":"Shelhamer, E., Long, J., Darrell, T.: Fully convolutional networks for semantic segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 39, 640\u2013651 (2017). https:\/\/doi.org\/10.1109\/TPAMI.2016.2572683","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"3156_CR19","doi-asserted-by":"publisher","unstructured":"Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR), vol. 01, pp. 1162\u20131167 (2017). https:\/\/doi.org\/10.1109\/ICDAR.2017.192","DOI":"10.1109\/ICDAR.2017.192"},{"key":"3156_CR20","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2577031","author":"S Ren","year":"2017","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster r-cnn: Towards real-time object detection with region proposal networks. IEEE Trans. Pattern Anal. Mach. Intell. (2017). https:\/\/doi.org\/10.1109\/TPAMI.2016.2577031","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"3156_CR21","doi-asserted-by":"crossref","unstructured":"Zhang, Z., Ma, J., Du, J., Wang, L., Zhang, J.: Multimodal pre-training based on graph attention network for document understanding. IEEE Trans. Multimed. (2022)","DOI":"10.1109\/TMM.2022.3214102"},{"issue":"1","key":"3156_CR22","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1007\/s42979-022-01414-4","volume":"4","author":"K Jobin","year":"2022","unstructured":"Jobin, K., Mondal, A., Jawahar, C.: Document image analysis using deep multi-modular features. SN Comput. Sci. 4(1), 5 (2022)","journal-title":"SN Comput. Sci."},{"key":"3156_CR23","doi-asserted-by":"publisher","first-page":"16197","DOI":"10.1007\/s11227-022-04525-0","volume":"78","author":"M Ponnusamy","year":"2022","unstructured":"Ponnusamy, M., BediP, S.T..e.a: Design and analysis of text document clustering using salp swarm algorithm. J. Supercomput. 78, 16197\u201316213 (2022)","journal-title":"J. Supercomput."},{"key":"3156_CR24","doi-asserted-by":"publisher","unstructured":"Matas, J., Chum, O., Urban, M., Pajdla, T.: Robust Wide-Baseline Stereo from Maximally Stable Extremal Regions, vol. 22 (2004). https:\/\/doi.org\/10.1016\/j.imavis.2004.02.006","DOI":"10.1016\/j.imavis.2004.02.006"},{"key":"3156_CR25","doi-asserted-by":"publisher","first-page":"755","DOI":"10.1007\/s00138-017-0837-3","volume":"28","author":"Y Song","year":"2017","unstructured":"Song, Y., Chen, J., Xie, H., Chen, Z., Gao, X., Chen, X.: Robust and parallel uyghur text localization in complex background images. Mach. Vis. Appl. 28, 755\u2013769 (2017). https:\/\/doi.org\/10.1007\/s00138-017-0837-3","journal-title":"Mach. Vis. Appl."},{"key":"3156_CR26","unstructured":"Hudson, L.: Pyzbar (2019). https:\/\/pypi.org\/project\/pyzbar\/ Accessed January 5, 2023"},{"key":"3156_CR27","doi-asserted-by":"publisher","DOI":"10.1145\/361237.361242","author":"RO Duda","year":"1972","unstructured":"Duda, R.O., Hart, P.E.: Use of the hough transformation to detect lines and curves in pictures. Commun. ACM (1972). https:\/\/doi.org\/10.1145\/361237.361242","journal-title":"Commun. ACM"},{"issue":"2","key":"3156_CR28","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","volume":"60","author":"DG Low","year":"2004","unstructured":"Low, D.G.: Distinctive image features from scale-invariant keypoints. Int. J. Comput. Vis. 60(2), 91\u2013110 (2004)","journal-title":"Int. J. Comput. Vis."},{"key":"3156_CR29","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1967.1053964","author":"TM Cover","year":"1967","unstructured":"Cover, T.M., Hart, P.E.: Nearest neighbor pattern classification. IEEE Trans. Inf. Theory (1967). https:\/\/doi.org\/10.1109\/TIT.1967.1053964","journal-title":"IEEE Trans. Inf. Theory"},{"key":"3156_CR30","doi-asserted-by":"publisher","unstructured":"Liu, S., Qi, L., Qin, H., Shi, J., Jia, J.: Path Aggregation Network for Instance Segmentation (2018). https:\/\/doi.org\/10.1109\/CVPR.2018.00913","DOI":"10.1109\/CVPR.2018.00913"},{"key":"3156_CR31","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., Farhadi, A.: You only look once: unified, real-time object detection. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 779\u2013788 (2016)","DOI":"10.1109\/CVPR.2016.91"},{"key":"3156_CR32","unstructured":"Xu, S., Wang, X., Lv, W., Chang, Q., Cui, C., Deng, K., Wang, G., Dang, Q., Wei, S., Du, Y., et al.: PP-YOLOE: an evolved version of yolo. arXiv preprint arXiv:2203.16250 (2022)"},{"key":"3156_CR33","doi-asserted-by":"publisher","DOI":"10.1145\/1276377.1276390","author":"S Avidan","year":"2007","unstructured":"Avidan, S., Shamir, A.: Seam carving for content-aware image resizing. ACM Trans. Graph. (2007). https:\/\/doi.org\/10.1145\/1276377.1276390","journal-title":"ACM Trans. Graph."},{"key":"3156_CR34","unstructured":"Bochkovskiy, A., Wang, C.-Y., Liao, H.-Y.M.: Yolov4: optimal speed and accuracy of object detection (2020) arXiv preprint arXiv:2004.10934"},{"key":"3156_CR35","doi-asserted-by":"publisher","unstructured":"Wang, C.-Y., Bochkovskiy, A., Liao, H.-Y.M.: YOLOv7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors (2022) https:\/\/doi.org\/10.48550\/ARXIV.2207.02696","DOI":"10.48550\/ARXIV.2207.02696"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-023-03156-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-023-03156-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-023-03156-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,13]],"date-time":"2024-08-13T15:10:36Z","timestamp":1723561836000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-023-03156-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,11,25]]},"references-count":35,"journal-issue":{"issue":"9","published-print":{"date-parts":[[2024,9]]}},"alternative-id":["3156"],"URL":"https:\/\/doi.org\/10.1007\/s00371-023-03156-7","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,11,25]]},"assertion":[{"value":"29 October 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 November 2023","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}