{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,13]],"date-time":"2026-02-13T20:35:00Z","timestamp":1771014900720,"version":"3.50.1"},"reference-count":82,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"8","license":[{"start":{"date-parts":[[2017,8,1]],"date-time":"2017-08-01T00:00:00Z","timestamp":1501545600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"funder":[{"name":"Dutch National Program"},{"name":"COMMIT"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. on Image Process."],"published-print":{"date-parts":[[2017,8]]},"DOI":"10.1109\/tip.2017.2707805","type":"journal-article","created":{"date-parts":[[2017,5,24]],"date-time":"2017-05-24T18:13:04Z","timestamp":1495649584000},"page":"3965-3980","source":"Crossref","is-referenced-by-count":35,"title":["Con-Text: Text Detection for Fine-Grained Object Classification"],"prefix":"10.1109","volume":"26","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-9073-9420","authenticated-orcid":false,"given":"Sezer","family":"Karaoglu","sequence":"first","affiliation":[]},{"given":"Ran","family":"Tao","sequence":"additional","affiliation":[]},{"given":"Jan C.","family":"van Gemert","sequence":"additional","affiliation":[]},{"given":"Theo","family":"Gevers","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2005.09.010"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1007\/s10032-015-0240-4"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2015.7333753"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0823-z"},{"key":"ref76","first-page":"52","article-title":"TRECVID 2014&#x2014;An overview of the goals, tasks, data, evaluation mechanisms and metrics","author":"over","year":"2014","journal-title":"Proc TRECVID"},{"key":"ref77","first-page":"391","article-title":"Edge boxes: Locating object proposals from edges","author":"zitnick","year":"2014","journal-title":"Proc ECCV"},{"key":"ref74","article-title":"TRECVID 2004 search and feature extraction task by NUS PRIS","author":"chua","year":"2004","journal-title":"Proc NIST TRECVID Workshop"},{"key":"ref39","doi-asserted-by":"crossref","first-page":"2296","DOI":"10.1109\/TIP.2013.2249082","article-title":"Scene text detection via connected component clustering and nontext filtering","volume":"22","author":"koo","year":"2013","journal-title":"IEEE Trans Image Process"},{"key":"ref75","article-title":"KU-ISPL TRECVID 2015 multimedia event detection system","author":"lee","year":"2014","journal-title":"Proc TRECVID"},{"key":"ref38","first-page":"29","article-title":"Geodesic saliency using background priors","author":"wei","year":"2012","journal-title":"Proc ECCV"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2004.02.006"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298778"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/DAS.2012.42"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1145\/1180639.1180698"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2009.112"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2009.5457577"},{"key":"ref37","author":"veit","year":"2016","journal-title":"COCO-text Dataset and benchmark for text detection and recognition in natural images"},{"key":"ref36","first-page":"740","article-title":"Microsoft COCO: Common objects in context","author":"lin","year":"2014","journal-title":"Proc ECCV"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298710"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-38628-2_35"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1145\/1631272.1631361"},{"key":"ref62","first-page":"1083","article-title":"Detecting texts of arbitrary orientations in natural images","author":"yao","year":"2012","journal-title":"Proc CVPR"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2014.2353813"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1145\/2393347.2396358"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2006.42"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.269"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2014.2317980"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1145\/2461466.2461486"},{"key":"ref66","doi-asserted-by":"crossref","first-page":"2594","DOI":"10.1109\/TIP.2011.2126586","article-title":"Text string detection from natural scenes by structure-based partition and grouping","volume":"20","author":"yi","year":"2011","journal-title":"IEEE Trans Image Process"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-013-0620-5"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1145\/1991996.1992021"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2006.68"},{"key":"ref69","doi-asserted-by":"crossref","first-page":"125","DOI":"10.1007\/s10032-015-0237-z","article-title":"Scene text extraction based on edges and support vector regression","volume":"18","author":"lu","year":"2015","journal-title":"Int J Document Anal Recognit"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/2502081.2502197"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33885-4_46"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2010.12.004"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6248097"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/2072298.2071930"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206816"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1023\/A:1023052124951"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1016\/j.visres.2010.01.002"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2009.5459462"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2006.3"},{"key":"ref59","first-page":"3466","article-title":"A codebook-free and annotation-free approach for fine-grained image categorization","author":"yao","year":"2012","journal-title":"Proc CVPR"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2013.221"},{"key":"ref57","first-page":"682","article-title":"ICDAR 2003 robust reading competitions","author":"lucas","year":"2005","journal-title":"Proc IJDAR"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-71496-5_44"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2014.2302896"},{"key":"ref54","first-page":"512","article-title":"Deep features for text spotting","author":"jaderberg","year":"2014","journal-title":"Proc ECCV"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2004.1334351"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2009.5459240"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2010.02.004"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2007.4408986"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2010.2070803"},{"key":"ref12","doi-asserted-by":"crossref","first-page":"353","DOI":"10.1109\/TPAMI.2010.70","article-title":"Learning to detect a salient object","volume":"33","author":"liu","year":"2011","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4471-6515-6_9"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4471-6515-6"},{"key":"ref15","first-page":"157","article-title":"Scene text recognition: No country for old men?","author":"g\u00f3mez","year":"2014","journal-title":"Proc ACCV Workshops"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2015.7333888"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/DAS.2014.44"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2014.2339814"},{"key":"ref17","doi-asserted-by":"crossref","first-page":"331","DOI":"10.1007\/s10032-014-0225-8","article-title":"Multimodal page classification in administrative document image streams","volume":"17","author":"rusi\u00f1ol","year":"2014","journal-title":"Int J Document Anal Recognit"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1117\/12.643463"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/BF01214362"},{"key":"ref80","author":"tolias","year":"2015","journal-title":"Particular object retrieval with integral max-pooling of cnn activations"},{"key":"ref4","first-page":"1457","article-title":"End-to-end scene text recognition","author":"wang","year":"2011","journal-title":"Proc ICCV"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2010.5540041"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-014-0733-5"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2011.144"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-014-0741-5"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.378"},{"key":"ref49","first-page":"144","article-title":"Extreme value theory based text binarization in documents and natural scenes","author":"fernando","year":"2010","journal-title":"Proc ICMV"},{"key":"ref9","first-page":"834","article-title":"Part-based R-CNNs for fine-grained category detection","author":"zhang","year":"2014","journal-title":"Proc ECCV"},{"key":"ref46","article-title":"OpenScan: A fully transparent optical scan voting system","author":"wang","year":"2010","journal-title":"Proceedings of Electronic Voting Technology Workshop"},{"key":"ref45","first-page":"2733","article-title":"The attraction of visual attention to texts in real-world scenes","author":"wang","year":"2011","journal-title":"Proc 3rd Annu Meeting of the Cogn Sci Soc"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1145\/1991996.1992010"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2007.40"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2011.168"},{"key":"ref41","first-page":"770","article-title":"A method for text localization and recognition in real-world images","author":"neumann","year":"2010","journal-title":"Proc ACCV"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2010.971"},{"key":"ref43","first-page":"3304","article-title":"End-to-end text recognition with convolutional neural networks","author":"wang","year":"2012","journal-title":"Proc ICPR"}],"container-title":["IEEE Transactions on Image Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/83\/7935144\/07933250.pdf?arnumber=7933250","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,12]],"date-time":"2022-01-12T16:14:39Z","timestamp":1642004079000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7933250\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,8]]},"references-count":82,"journal-issue":{"issue":"8"},"URL":"https:\/\/doi.org\/10.1109\/tip.2017.2707805","relation":{},"ISSN":["1057-7149","1941-0042"],"issn-type":[{"value":"1057-7149","type":"print"},{"value":"1941-0042","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017,8]]}}}