{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,10]],"date-time":"2024-09-10T08:51:39Z","timestamp":1725958299436},"publisher-location":"Singapore","reference-count":27,"publisher":"Springer Singapore","isbn-type":[{"type":"print","value":"9789811085291"},{"type":"electronic","value":"9789811085307"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-981-10-8530-7_16","type":"book-chapter","created":{"date-parts":[[2018,2,28]],"date-time":"2018-02-28T15:04:19Z","timestamp":1519830259000},"page":"160-168","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["A Robust End-to-End Neural Network for Scene Text Detection"],"prefix":"10.1007","author":[{"given":"Qi","family":"Yuan","sequence":"first","affiliation":[]},{"given":"Haojie","family":"Li","sequence":"additional","affiliation":[]},{"given":"Zhihui","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Xin","family":"Fan","sequence":"additional","affiliation":[]},{"given":"Zhongxuan","family":"Luo","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,3,1]]},"reference":[{"key":"16_CR1","doi-asserted-by":"crossref","unstructured":"Busta, M., Neumann, L., Matas, J.: FASText: efficient unconstrained scene text detector. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1206\u20131214 (2015)","DOI":"10.1109\/ICCV.2015.143"},{"key":"16_CR2","doi-asserted-by":"crossref","unstructured":"Chen, X., Yuille, A.L.: Detecting and reading text in natural scenes. In: Proceedings of the 2004 IEEE Computer Society Conference on Computer Vision and Pattern Recognition, CVPR 2004, vol. 2, p. II. IEEE (2004)","DOI":"10.1109\/CVPR.2004.1315187"},{"key":"16_CR3","doi-asserted-by":"crossref","unstructured":"Epshtein, B., Ofek, E., Wexler, Y.: Detecting text in natural scenes with stroke width transform. In: 2010 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 2963\u20132970. IEEE (2010)","DOI":"10.1109\/CVPR.2010.5540041"},{"key":"16_CR4","doi-asserted-by":"crossref","unstructured":"Girshick, R.: Fast R-CNN. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1440\u20131448 (2015)","DOI":"10.1109\/ICCV.2015.169"},{"key":"16_CR5","doi-asserted-by":"crossref","unstructured":"Gupta, A., Vedaldi, A., Zisserman, A.: Synthetic data for text localisation in natural images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2315\u20132324 (2016)","DOI":"10.1109\/CVPR.2016.254"},{"issue":"6","key":"16_CR6","doi-asserted-by":"crossref","first-page":"2529","DOI":"10.1109\/TIP.2016.2547588","volume":"25","author":"T He","year":"2016","unstructured":"He, T., Huang, W., Qiao, Y., Yao, J.: Text-attentional convolutional neural network for scene text detection. IEEE Trans. Image Process. 25(6), 2529\u20132541 (2016)","journal-title":"IEEE Trans. Image Process."},{"key":"16_CR7","doi-asserted-by":"crossref","unstructured":"Huang, W., Lin, Z., Yang, J., Wang, J.: Text localization in natural images using stroke feature transform and text covariance descriptors. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1241\u20131248 (2013)","DOI":"10.1109\/ICCV.2013.157"},{"key":"16_CR8","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"497","DOI":"10.1007\/978-3-319-10593-2_33","volume-title":"Computer Vision \u2013 ECCV 2014","author":"W Huang","year":"2014","unstructured":"Huang, W., Qiao, Y., Tang, X.: Robust scene text detection with convolution neural network induced MSER trees. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8692, pp. 497\u2013511. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-10593-2_33"},{"key":"16_CR9","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"512","DOI":"10.1007\/978-3-319-10593-2_34","volume-title":"Computer Vision \u2013 ECCV 2014","author":"M Jaderberg","year":"2014","unstructured":"Jaderberg, M., Vedaldi, A., Zisserman, A.: Deep features for text spotting. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8692, pp. 512\u2013528. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-10593-2_34"},{"key":"16_CR10","doi-asserted-by":"crossref","unstructured":"Karatzas, D., Shafait, F., Uchida, S., Iwamura, M., i Bigorda, L.G., Mestre, S.R., Mas, J., Mota, D.F., Almazan, J.A., de las Heras, L.P.: ICDAR 2013 robust reading competition. In: 2013 12th International Conference on Document Analysis and Recognition (ICDAR), pp. 1484\u20131493. IEEE (2013)","DOI":"10.1109\/ICDAR.2013.221"},{"key":"16_CR11","doi-asserted-by":"crossref","unstructured":"Liao, M., Shi, B., Bai, X., Wang, X., Liu, W.: TextBoxes: a fast text detector with a single deep neural network. arXiv arXiv:1611.06779 (2016)","DOI":"10.1609\/aaai.v31i1.11196"},{"key":"16_CR12","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1007\/978-3-319-46448-0_2","volume-title":"Computer Vision \u2013 ECCV 2016","author":"W Liu","year":"2016","unstructured":"Liu, W., Anguelov, D., Erhan, D., Szegedy, C., Reed, S., Fu, C.-Y., Berg, A.C.: SSD: single shot multibox detector. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9905, pp. 21\u201337. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46448-0_2"},{"issue":"2","key":"16_CR13","doi-asserted-by":"crossref","first-page":"125","DOI":"10.1007\/s10032-015-0237-z","volume":"18","author":"S Lu","year":"2015","unstructured":"Lu, S., Chen, T., Tian, S., Lim, J.H., Tan, C.L.: Scene text extraction based on edges and support vector regression. Int. J. Doc. Anal. Recognit. (IJDAR) 18(2), 125\u2013135 (2015)","journal-title":"Int. J. Doc. Anal. Recognit. (IJDAR)"},{"key":"16_CR14","doi-asserted-by":"crossref","unstructured":"Neumann, L., Matas, J.: Real-time scene text localization and recognition. In: 2012 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 3538\u20133545. IEEE (2012)","DOI":"10.1109\/CVPR.2012.6248097"},{"key":"16_CR15","doi-asserted-by":"crossref","unstructured":"Neumann, L., Matas, J.: Efficient scene text localization and recognition with local character refinement. In: 2015 13th International Conference on Document Analysis and Recognition (ICDAR), pp. 746\u2013750. IEEE (2015)","DOI":"10.1109\/ICDAR.2015.7333861"},{"key":"16_CR16","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., Farhadi, A.: You only look once: unified, real-time object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 779\u2013788 (2016)","DOI":"10.1109\/CVPR.2016.91"},{"key":"16_CR17","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster R-CNN: towards real-time object detection with region proposal networks. In: Advances in Neural Information Processing Systems, pp. 91\u201399 (2015)"},{"key":"16_CR18","doi-asserted-by":"crossref","unstructured":"Shahab, A., Shafait, F., Dengel, A.: ICDAR 2011 robust reading competition challenge 2: reading text in scene images. In: 2011 International Conference on Document Analysis and Recognition (ICDAR), pp. 1491\u20131496. IEEE (2011)","DOI":"10.1109\/ICDAR.2011.296"},{"issue":"2","key":"16_CR19","doi-asserted-by":"crossref","first-page":"107","DOI":"10.1016\/j.patrec.2012.09.019","volume":"34","author":"C Shi","year":"2013","unstructured":"Shi, C., Wang, C., Xiao, B., Zhang, Y., Gao, S.: Scene text detection using graph model built upon maximally stable extremal regions. Pattern Recognit. Lett. 34(2), 107\u2013116 (2013)","journal-title":"Pattern Recognit. Lett."},{"key":"16_CR20","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556 (2014)"},{"key":"16_CR21","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Liu, W., Jia, Y., Sermanet, P., Reed, S., Anguelov, D., Erhan, D., Vanhoucke, V., Rabinovich, A.: Going deeper with convolutions. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1\u20139 (2015)","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"16_CR22","doi-asserted-by":"crossref","unstructured":"Tian, S., Pan, Y., Huang, C., Lu, S., Yu, K., Tan, L.C.: Text flow: a unified text detection system in natural scene images. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 4651\u20134659 (2015)","DOI":"10.1109\/ICCV.2015.528"},{"issue":"4","key":"16_CR23","doi-asserted-by":"crossref","first-page":"280","DOI":"10.1007\/s10032-006-0014-0","volume":"8","author":"C Wolf","year":"2006","unstructured":"Wolf, C., Jolion, J.M.: Object count\/area graphs for the evaluation of object detection and segmentation algorithms. IJDAR 8(4), 280\u2013296 (2006)","journal-title":"IJDAR"},{"issue":"5","key":"16_CR24","doi-asserted-by":"crossref","first-page":"970","DOI":"10.1109\/TPAMI.2013.182","volume":"36","author":"XC Yin","year":"2014","unstructured":"Yin, X.C., Yin, X., Huang, K., Hao, H.W.: Robust text detection in natural scene images. IEEE Trans. Pattern Anal. Mach. Intell. 36(5), 970\u2013983 (2014)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"16_CR25","doi-asserted-by":"crossref","unstructured":"Zhang, H., Kyaw, Z., Chang, S.F., Chua, T.S.: Visual translation embedding network for visual relation detection. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.331"},{"key":"16_CR26","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/2978656","volume":"13","author":"H Zhang","year":"2016","unstructured":"Zhang, H., Shang, X., Luan, H., Wang, M., Chua, T.S.: Learning from collective intelligence: feature learning using social images and tags. ACM Trans. Multimed. Comput. Commun. Appl. (TOMM) 13, 1 (2016)","journal-title":"ACM Trans. Multimed. Comput. Commun. Appl. (TOMM)"},{"key":"16_CR27","doi-asserted-by":"crossref","unstructured":"Zhang, Z., Shen, W., Yao, C., Bai, X.: Symmetry-based text line detection in natural scenes. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2558\u20132567 (2015)","DOI":"10.1109\/CVPR.2015.7298871"}],"container-title":["Communications in Computer and Information Science","Internet Multimedia Computing and Service"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-10-8530-7_16","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,15]],"date-time":"2022-08-15T01:04:14Z","timestamp":1660525454000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-981-10-8530-7_16"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9789811085291","9789811085307"],"references-count":27,"URL":"https:\/\/doi.org\/10.1007\/978-981-10-8530-7_16","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"type":"print","value":"1865-0929"},{"type":"electronic","value":"1865-0937"}],"subject":[],"published":{"date-parts":[[2018]]}}}