{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T14:44:34Z","timestamp":1742913874903,"version":"3.40.3"},"publisher-location":"Cham","reference-count":30,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783031216473"},{"type":"electronic","value":"9783031216480"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-21648-0_32","type":"book-chapter","created":{"date-parts":[[2022,11,25]],"date-time":"2022-11-25T00:05:14Z","timestamp":1669334714000},"page":"468-483","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Synthetic Data Generation for\u00a0Semantic Segmentation of\u00a0Lecture Videos"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6308-7113","authenticated-orcid":false,"given":"Kenny","family":"Davila","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9353-9528","authenticated-orcid":false,"given":"Fei","family":"Xu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5221-2692","authenticated-orcid":false,"given":"James","family":"Molina","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7118-9280","authenticated-orcid":false,"given":"Srirangaraj","family":"Setlur","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5318-7409","authenticated-orcid":false,"given":"Venu","family":"Govindaraju","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,11,25]]},"reference":[{"key":"32_CR1","doi-asserted-by":"crossref","unstructured":"Cagliero, L., Canale, L., Farinetti, L.: Visa: a supervised approach to indexing video lectures with semantic annotations. In: 2019 IEEE 43rd Annual Computer Software and Applications Conference (COMPSAC), vol. 1, pp. 226\u2013235. IEEE (2019)","DOI":"10.1109\/COMPSAC.2019.00041"},{"key":"32_CR2","doi-asserted-by":"crossref","unstructured":"Ch\u2019ng, C.K., Chan, C.S.: Total-text: a comprehensive dataset for scene text detection and recognition. In: 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR), vol. 1, pp. 935\u2013942. IEEE (2017)","DOI":"10.1109\/ICDAR.2017.157"},{"key":"32_CR3","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"681","DOI":"10.1007\/978-3-030-15712-8_44","volume-title":"Advances in Information Retrieval","author":"K Davila","year":"2019","unstructured":"Davila, K., Joshi, R., Setlur, S., Govindaraju, V., Zanibbi, R.: Tangent-V: math formula image search using line-of-sight graphs. In: Azzopardi, L., Stein, B., Fuhr, N., Mayr, P., Hauff, C., Hiemstra, D. (eds.) ECIR 2019. LNCS, vol. 11437, pp. 681\u2013695. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-15712-8_44"},{"key":"32_CR4","doi-asserted-by":"publisher","first-page":"104469","DOI":"10.1109\/ACCESS.2021.3099427","volume":"9","author":"K Davila","year":"2021","unstructured":"Davila, K., Xu, F., Setlur, S., Govindaraju, V.: Fcn-lecturenet: extractive summarization of whiteboard and chalkboard lecture videos. IEEE Access 9, 104469\u2013104484 (2021)","journal-title":"IEEE Access"},{"key":"32_CR5","doi-asserted-by":"crossref","unstructured":"Davila, K., Zanibbi, R.: Whiteboard video summarization via spatio-temporal conflict minimization. In: 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR), vol. 1, pp. 355\u2013362. IEEE (2017)","DOI":"10.1109\/ICDAR.2017.66"},{"key":"32_CR6","doi-asserted-by":"crossref","unstructured":"Davila, K., Zanibbi, R.: Visual search engine for handwritten and typeset math in lecture videos and latex notes. In: 2018 16th International Conference on Frontiers in Handwriting Recognition (ICFHR), pp. 50\u201355. IEEE (2018)","DOI":"10.1109\/ICFHR-2018.2018.00018"},{"key":"32_CR7","doi-asserted-by":"crossref","unstructured":"Deng, D., Liu, H., Li, X., Cai, D.: Pixellink: detecting scene text via instance segmentation. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 32 (2018)","DOI":"10.1609\/aaai.v32i1.12269"},{"key":"32_CR8","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1007\/978-3-030-86198-8_7","volume-title":"Document Analysis and Recognition \u2013 ICDAR 2021 Workshops","author":"A Dey","year":"2021","unstructured":"Dey, A., Zanibbi, R.: ScanSSD-XYc: faster detection for math formulas. In: Barney Smith, E.H., Pal, U. (eds.) ICDAR 2021. LNCS, vol. 12916, pp. 91\u201396. Springer, Cham (2021). https:\/\/doi.org\/10.1007\/978-3-030-86198-8_7"},{"key":"32_CR9","doi-asserted-by":"crossref","unstructured":"Dutta, K., Mathew, M., Krishnan, P., Jawahar, C.: Localizing and recognizing text in lecture videos. In: 2018 16th International Conference on Frontiers in Handwriting Recognition (ICFHR), pp. 235\u2013240. IEEE (2018)","DOI":"10.1109\/ICFHR-2018.2018.00049"},{"key":"32_CR10","doi-asserted-by":"crossref","unstructured":"Guan, M., Ding, H., Chen, K., Huo, Q.: Improving handwritten OCR with augmented text line images synthesized from online handwriting samples by style-conditioned GAN. In: 2020 17th International Conference on Frontiers in Handwriting Recognition (ICFHR), pp. 151\u2013156. IEEE (2020)","DOI":"10.1109\/ICFHR2020.2020.00037"},{"key":"32_CR11","doi-asserted-by":"crossref","unstructured":"Gupta, A., Vedaldi, A., Zisserman, A.: Synthetic data for text localisation in natural images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2315\u20132324 (2016)","DOI":"10.1109\/CVPR.2016.254"},{"issue":"16","key":"32_CR12","doi-asserted-by":"publisher","first-page":"7610","DOI":"10.3390\/app11167610","volume":"11","author":"KA Hashmi","year":"2021","unstructured":"Hashmi, K.A., Pagani, A., Liwicki, M., Stricker, D., Afzal, M.Z.: Cascade network with deformable composite backbone for formula detection in scanned document images. Appl. Sci. 11(16), 7610 (2021)","journal-title":"Appl. Sci."},{"key":"32_CR13","doi-asserted-by":"crossref","unstructured":"Haurilet, M., Roitberg, A., Martinez, M., Stiefelhagen, R.: Wise-slide segmentation in the wild. In: 2019 International Conference on Document Analysis and Recognition (ICDAR), pp. 343\u2013348. IEEE (2019)","DOI":"10.1109\/ICDAR.2019.00062"},{"key":"32_CR14","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Doll\u00e1r, P., Girshick, R.: Mask r-cnn. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2961\u20132969 (2017)","DOI":"10.1109\/ICCV.2017.322"},{"key":"32_CR15","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"32_CR16","doi-asserted-by":"crossref","unstructured":"Husain, M., Meena, S.: Multimodal fusion of speech and text using semi-supervised LDA for indexing lecture videos. In: 2019 National Conference on Communications (NCC), pp. 1\u20136. IEEE (2019)","DOI":"10.1109\/NCC.2019.8732253"},{"key":"32_CR17","doi-asserted-by":"crossref","unstructured":"Liao, M., Wan, Z., Yao, C., Chen, K., Bai, X.: Real-time scene text detection with differentiable binarization. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 34, pp. 11474\u201311481 (2020)","DOI":"10.1609\/aaai.v34i07.6812"},{"key":"32_CR18","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., Belongie, S.: Feature pyramid networks for object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2117\u20132125 (2017)","DOI":"10.1109\/CVPR.2017.106"},{"key":"32_CR19","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"740","DOI":"10.1007\/978-3-319-10602-1_48","volume-title":"Computer Vision \u2013 ECCV 2014","author":"T-Y Lin","year":"2014","unstructured":"Lin, T.-Y., et al.: Microsoft COCO: common objects in context. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8693, pp. 740\u2013755. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-10602-1_48"},{"issue":"1","key":"32_CR20","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1007\/s11263-020-01369-0","volume":"129","author":"S Long","year":"2021","unstructured":"Long, S., He, X., Yao, C.: Scene text detection and recognition: the deep learning era. Int. J. Comput. Vis. 129(1), 161\u2013184 (2021). https:\/\/doi.org\/10.1007\/s11263-020-01369-0","journal-title":"Int. J. Comput. Vis."},{"key":"32_CR21","doi-asserted-by":"crossref","unstructured":"Mahdavi, M., Zanibbi, R., Mouchere, H., Viard-Gaudin, C., Garain, U.: ICDAR 2019 CROHME+ TFD: competition on recognition of handwritten mathematical expressions and typeset formula detection. In: 2019 International Conference on Document Analysis and Recognition (ICDAR), pp. 1533\u20131538. IEEE (2019)","DOI":"10.1109\/ICDAR.2019.00247"},{"issue":"1","key":"32_CR22","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1007\/s100320200071","volume":"5","author":"UV Marti","year":"2002","unstructured":"Marti, U.V., Bunke, H.: The iam-database: an English sentence database for offline handwriting recognition. Int. J. Doc. Anal. Recogn. 5(1), 39\u201346 (2002)","journal-title":"Int. J. Doc. Anal. Recogn."},{"key":"32_CR23","doi-asserted-by":"publisher","first-page":"83663","DOI":"10.1109\/ACCESS.2020.2992067","volume":"8","author":"BH Phong","year":"2020","unstructured":"Phong, B.H., Hoang, T.M., Le, T.L.: A hybrid method for mathematical expression detection in scientific document images. IEEE Access 8, 83663\u201383684 (2020)","journal-title":"IEEE Access"},{"key":"32_CR24","doi-asserted-by":"crossref","unstructured":"Pratikakis, I., Zagoris, K., Barlas, G., Gatos, B.: ICFHR 2016 handwritten document image binarization contest (H-DIBCO 2016). In: 2016 15th International Conference on Frontiers in Handwriting Recognition (ICFHR), pp. 619\u2013623. IEEE (2016)","DOI":"10.1109\/ICFHR.2016.0118"},{"key":"32_CR25","doi-asserted-by":"crossref","unstructured":"Springstein, M., M\u00fcller-Budack, E., Ewerth, R.: Unsupervised training data generation of handwritten formulas using generative adversarial networks with self-attention. In: Proceedings of the 2021 Workshop on Multi-Modal Pre-Training for Multimedia Understanding, pp. 46\u201354 (2021)","DOI":"10.1145\/3463945.3469059"},{"key":"32_CR26","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1016\/j.patrec.2019.11.001","volume":"129","author":"M Villamizar","year":"2020","unstructured":"Villamizar, M., Can\u00e9vet, O., Odobez, J.M.: Multi-scale sequential network for semantic text segmentation and localization. Pattern Recogn. Lett. 129, 63\u201369 (2020)","journal-title":"Pattern Recogn. Lett."},{"key":"32_CR27","doi-asserted-by":"crossref","unstructured":"Wang, W., et al.: Shape robust text detection with progressive scale expansion network. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9336\u20139345 (2019)","DOI":"10.1109\/CVPR.2019.00956"},{"key":"32_CR28","doi-asserted-by":"crossref","unstructured":"Wolf, F., Brandenbusch, K., Fink, G.A.: Improving handwritten word synthesis for annotation-free word spotting. In: 2020 17th International Conference on Frontiers in Handwriting Recognition (ICFHR), pp. 61\u201366. IEEE (2020)","DOI":"10.1109\/ICFHR2020.2020.00022"},{"key":"32_CR29","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"109","DOI":"10.1007\/978-3-030-86337-1_8","volume-title":"Document Analysis and Recognition \u2013 ICDAR 2021","author":"M Yim","year":"2021","unstructured":"Yim, M., Kim, Y., Cho, H.-C., Park, S.: SynthTIGER: synthetic text image GEneratoR towards better text recognition models. In: Llad\u00f3s, J., Lopresti, D., Uchida, S. (eds.) ICDAR 2021. LNCS, vol. 12824, pp. 109\u2013124. Springer, Cham (2021). https:\/\/doi.org\/10.1007\/978-3-030-86337-1_8"},{"key":"32_CR30","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107336","volume":"110","author":"Y Zhu","year":"2021","unstructured":"Zhu, Y., Du, J.: Textmountain: accurate scene text detection via instance segmentation. Pattern Recogn. 110, 107336 (2021)","journal-title":"Pattern Recogn."}],"container-title":["Lecture Notes in Computer Science","Frontiers in Handwriting Recognition"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-21648-0_32","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,13]],"date-time":"2024-03-13T14:54:12Z","timestamp":1710341652000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-21648-0_32"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031216473","9783031216480"],"references-count":30,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-21648-0_32","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"25 November 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICFHR","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Frontiers in Handwriting Recognition","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Hyderabad","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"India","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2022","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 December 2022","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"7 December 2022","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icfhr2022","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/icfhr2022.org","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Easychair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"61","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"36","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"59% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"4","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}