{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,5]],"date-time":"2026-02-05T12:30:43Z","timestamp":1770294643739,"version":"3.49.0"},"publisher-location":"Cham","reference-count":55,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031726972","type":"print"},{"value":"9783031726989","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,10,26]],"date-time":"2024-10-26T00:00:00Z","timestamp":1729900800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,10,26]],"date-time":"2024-10-26T00:00:00Z","timestamp":1729900800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-72698-9_24","type":"book-chapter","created":{"date-parts":[[2024,10,25]],"date-time":"2024-10-25T04:45:57Z","timestamp":1729831557000},"page":"410-427","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["EAFormer: Scene Text Segmentation with\u00a0Edge-Aware Transformers"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2747-7338","authenticated-orcid":false,"given":"Haiyang","family":"Yu","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0009-8413-2185","authenticated-orcid":false,"given":"Teng","family":"Fu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9633-0033","authenticated-orcid":false,"given":"Bin","family":"Li","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4897-9209","authenticated-orcid":false,"given":"Xiangyang","family":"Xue","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,10,26]]},"reference":[{"issue":"1","key":"24_CR1","doi-asserted-by":"publisher","first-page":"60","DOI":"10.3390\/electronics11010060","volume":"11","author":"P Andreini","year":"2021","unstructured":"Andreini, P., et al.: A two-stage gan for high-resolution retinal image generation and segmentation. Electronics 11(1), 60 (2021)","journal-title":"Electronics"},{"key":"24_CR2","doi-asserted-by":"crossref","unstructured":"Bai, B., Yin, F., Liu, C.L.: A seed-based segmentation method for scene text extraction. In: 2014 11th IAPR International Workshop on Document Analysis Systems, pp. 262\u2013266. IEEE (2014)","DOI":"10.1109\/DAS.2014.34"},{"key":"24_CR3","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"238","DOI":"10.1007\/978-3-030-30508-6_20","volume-title":"Artificial Neural Networks and Machine Learning \u2013 ICANN 2019: Image Processing","author":"S Bonechi","year":"2019","unstructured":"Bonechi, S., Andreini, P., Bianchini, M., Scarselli, F.: COCO_TS dataset: pixel\u2013level annotations based on weak supervision for scene text segmentation. In: Tetko, I.V., K\u016frkov\u00e1, V., Karpov, P., Theis, F. (eds.) ICANN 2019. LNCS, vol. 11729, pp. 238\u2013250. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-30508-6_20"},{"key":"24_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.patrec.2020.06.023","volume":"138","author":"S Bonechi","year":"2020","unstructured":"Bonechi, S., Bianchini, M., Scarselli, F., Andreini, P.: Weak supervision for generating pixel-level annotations in scene text segmentation. Pattern Recogn. Lett. 138, 1\u20137 (2020)","journal-title":"Pattern Recogn. Lett."},{"key":"24_CR5","doi-asserted-by":"publisher","first-page":"679","DOI":"10.1109\/TPAMI.1986.4767851","volume":"6","author":"J Canny","year":"1986","unstructured":"Canny, J.: A computational approach to edge detection. IEEE Trans. Pattern Anal. Mach. Intell. 6, 679\u2013698 (1986)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"11","key":"24_CR6","doi-asserted-by":"publisher","first-page":"4513","DOI":"10.1109\/TGRS.2012.2194502","volume":"50","author":"J Chen","year":"2012","unstructured":"Chen, J., Li, J., Pan, D., Zhu, Q., Mao, Z.: Edge-guided multiscale segmentation of satellite multispectral imagery. IEEE Trans. Geosci. Remote Sens. 50(11), 4513\u20134520 (2012)","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"key":"24_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"833","DOI":"10.1007\/978-3-030-01234-2_49","volume-title":"Computer Vision \u2013 ECCV 2018","author":"L-C Chen","year":"2018","unstructured":"Chen, L.-C., Zhu, Y., Papandreou, G., Schroff, F., Adam, H.: Encoder-decoder with atrous separable convolution for semantic image segmentation. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11211, pp. 833\u2013851. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01234-2_49"},{"key":"24_CR8","doi-asserted-by":"crossref","unstructured":"Ch\u2019ng, C.K., Chan, C.S.: Total-text: a comprehensive dataset for scene text detection and recognition. In: 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR), vol.\u00a01, pp. 935\u2013942. IEEE (2017)","DOI":"10.1109\/ICDAR.2017.157"},{"issue":"4","key":"24_CR9","doi-asserted-by":"publisher","first-page":"376","DOI":"10.1109\/TCE.2022.3205376","volume":"68","author":"R Cong","year":"2022","unstructured":"Cong, R., Zhang, Y., Yang, N., Li, H., Zhang, X., Li, R., Chen, Z., Zhao, Y., Kwong, S.: Boundary guided semantic learning for real-time covid-19 lung infection segmentation system. IEEE Trans. Consum. Electron. 68(4), 376\u2013386 (2022)","journal-title":"IEEE Trans. Consum. Electron."},{"key":"24_CR10","doi-asserted-by":"crossref","unstructured":"Conrad, B., Chen, P.I.: Two-stage seamless text erasing on real-world scene images. In: 2021 IEEE International Conference on Image Processing (ICIP), pp. 1309\u20131313. IEEE (2021)","DOI":"10.1109\/ICIP42928.2021.9506394"},{"key":"24_CR11","doi-asserted-by":"crossref","unstructured":"Dai, Y., et al.: Fused text segmentation networks for multi-oriented scene text detection. In: 2018 24th International Conference on Pattern Recognition (ICPR), pp. 3604\u20133609. IEEE (2018)","DOI":"10.1109\/ICPR.2018.8546066"},{"key":"24_CR12","doi-asserted-by":"crossref","unstructured":"Du, X., Zhou, Z., Zheng, Y., Ma, T., Wu, X., Jin, C.: Modeling stroke mask for end-to-end text erasing. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 6151\u20136159 (2023)","DOI":"10.1109\/WACV56688.2023.00609"},{"key":"24_CR13","doi-asserted-by":"crossref","unstructured":"Ess, A., M\u00fcller, T., Grabner, H., Van\u00a0Gool, L.: Segmentation-based urban traffic scene understanding. In: BMVC, vol.\u00a01, p.\u00a02. Citeseer (2009)","DOI":"10.5244\/C.23.84"},{"issue":"6","key":"24_CR14","doi-asserted-by":"publisher","first-page":"2547","DOI":"10.1109\/TNNLS.2020.3006524","volume":"32","author":"J Fu","year":"2020","unstructured":"Fu, J., Liu, J., Jiang, J., Li, Y., Bao, Y., Lu, H.: Scene segmentation with dual relation-aware attention network. IEEE Trans. Neural Networks Learn. Syst. 32(6), 2547\u20132560 (2020)","journal-title":"IEEE Trans. Neural Networks Learn. Syst."},{"issue":"7","key":"24_CR15","doi-asserted-by":"publisher","first-page":"1079","DOI":"10.1109\/5.156471","volume":"80","author":"H Fujisawa","year":"1992","unstructured":"Fujisawa, H., Nakano, Y., Kurino, K.: Segmentation methods for character recognition: from segmentation to document structure analysis. Proc. IEEE 80(7), 1079\u20131092 (1992)","journal-title":"Proc. IEEE"},{"key":"24_CR16","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"24_CR17","doi-asserted-by":"crossref","unstructured":"He, W., Zhang, X.Y., Yin, F., Liu, C.L.: Deep direct regression for multi-oriented scene text detection. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 745\u2013753 (2017)","DOI":"10.1109\/ICCV.2017.87"},{"issue":"11","key":"24_CR18","doi-asserted-by":"publisher","first-page":"5406","DOI":"10.1109\/TIP.2018.2855399","volume":"27","author":"W He","year":"2018","unstructured":"He, W., Zhang, X.Y., Yin, F., Liu, C.L.: Multi-oriented and multi-lingual scene text detection with direct regression. IEEE Trans. Image Process. 27(11), 5406\u20135419 (2018)","journal-title":"IEEE Trans. Image Process."},{"key":"24_CR19","doi-asserted-by":"crossref","unstructured":"Karatzas, D., et al.: Icdar 2013 robust reading competition. In: 2013 12th International Conference on Document Analysis and Recognition, pp. 1484\u20131493. IEEE (2013)","DOI":"10.1109\/ICDAR.2013.221"},{"key":"24_CR20","doi-asserted-by":"crossref","unstructured":"Liao, M., Wan, Z., Yao, C., Chen, K., Bai, X.: Real-time scene text detection with differentiable binarization. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol.\u00a034, pp. 11474\u201311481 (2020)","DOI":"10.1609\/aaai.v34i07.6812"},{"key":"24_CR21","doi-asserted-by":"crossref","unstructured":"Liu, X., Samarabandu, J.: Multiscale edge-based text extraction from complex images. In: 2006 IEEE International Conference on Multimedia and Expo, pp. 1721\u20131724. IEEE (2006)","DOI":"10.1109\/ICME.2006.262882"},{"issue":"6","key":"24_CR22","doi-asserted-by":"publisher","first-page":"1353","DOI":"10.3390\/rs14061353","volume":"14","author":"Z Liu","year":"2022","unstructured":"Liu, Z., Li, J., Song, R., Wu, C., Liu, W., Li, Z., Li, Y.: Edge guided context aggregation network for semantic segmentation of remote sensing imagery. Remote Sensing 14(6), 1353 (2022)","journal-title":"Remote Sensing"},{"key":"24_CR23","unstructured":"Loshchilov, I., Hutter, F.: Decoupled weight decay regularization. In: International Conference on Learning Representations (2018)"},{"key":"24_CR24","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109531","volume":"140","author":"G Lyu","year":"2023","unstructured":"Lyu, G., Liu, K., Zhu, A., Uchida, S., Iwana, B.K.: Fetnet: feature erasing and transferring network for scene text removal. Pattern Recogn. 140, 109531 (2023)","journal-title":"Pattern Recogn."},{"key":"24_CR25","doi-asserted-by":"crossref","unstructured":"Lyu, P., Yao, C., Wu, W., Yan, S., Bai, X.: Multi-oriented scene text detection via corner localization and region segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7553\u20137563 (2018)","DOI":"10.1109\/CVPR.2018.00788"},{"key":"24_CR26","unstructured":"Ma, H., Yang, H., Huang, D.: Boundary guided context aggregation for semantic segmentation. arXiv preprint arXiv:2110.14587 (2021)"},{"issue":"11","key":"24_CR27","doi-asserted-by":"publisher","first-page":"3111","DOI":"10.1109\/TMM.2018.2818020","volume":"20","author":"J Ma","year":"2018","unstructured":"Ma, J., Shao, W., Ye, H., Wang, L., Wang, H., Zheng, Y., Xue, X.: Arbitrary-oriented scene text detection via rotation proposals. IEEE Trans. Multimedia 20(11), 3111\u20133122 (2018)","journal-title":"IEEE Trans. Multimedia"},{"key":"24_CR28","doi-asserted-by":"crossref","unstructured":"Ma, J., Jin, L., Zhang, J., Jiang, J., Xue, Y., He, M.: Textsrnet: scene text super-resolution based on contour prior and atrous convolution. In: 2022 26th International Conference on Pattern Recognition (ICPR), pp. 3252\u20133258. IEEE (2022)","DOI":"10.1109\/ICPR56361.2022.9956491"},{"key":"24_CR29","doi-asserted-by":"crossref","unstructured":"Mustafa, W.A., Kader, M.M.M.A.: Binarization of document image using optimum threshold modification. In: Journal of Physics: Conference Series, vol.\u00a01019, p. 012022. IOP Publishing (2018)","DOI":"10.1088\/1742-6596\/1019\/1\/012022"},{"issue":"1","key":"24_CR30","doi-asserted-by":"publisher","first-page":"62","DOI":"10.1109\/TSMC.1979.4310076","volume":"9","author":"N Otsu","year":"1979","unstructured":"Otsu, N.: A threshold selection method from gray-level histograms. IEEE Trans. Syst. Man Cybern. 9(1), 62\u201366 (1979)","journal-title":"IEEE Trans. Syst. Man Cybern."},{"key":"24_CR31","doi-asserted-by":"crossref","unstructured":"Pack, C., Soh, L.K., Lorang, E.: Perceptual cue-guided adaptive image downscaling for enhanced semantic segmentation on large document images. Int. J. Document Anal. Recogn. (IJDAR), 1\u201317 (2023)","DOI":"10.1007\/s10032-023-00454-7"},{"key":"24_CR32","doi-asserted-by":"crossref","unstructured":"Ren, Y., Zhang, J., Chen, B., Zhang, X., Jin, L.: Looking from a higher-level perspective: attention and recognition enhanced multi-scale scene text segmentation. In: Proceedings of the Asian Conference on Computer Vision, pp. 3138\u20133154 (2022)","DOI":"10.1007\/978-3-031-26293-7_38"},{"issue":"2","key":"24_CR33","doi-asserted-by":"publisher","first-page":"225","DOI":"10.1016\/S0031-3203(99)00055-2","volume":"33","author":"J Sauvola","year":"2000","unstructured":"Sauvola, J., Pietik\u00e4inen, M.: Adaptive document image binarization. Pattern Recogn. 33(2), 225\u2013236 (2000)","journal-title":"Pattern Recogn."},{"key":"24_CR34","doi-asserted-by":"crossref","unstructured":"Shi, B., Bai, X., Belongie, S.: Detecting oriented text in natural images by linking segments. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2550\u20132558 (2017)","DOI":"10.1109\/CVPR.2017.371"},{"key":"24_CR35","doi-asserted-by":"crossref","unstructured":"Shu, R., Zhao, C., Feng, S., Zhu, L., Miao, D.: Text-enhanced scene image super-resolution via stroke mask and orthogonal attention. IEEE Trans. Circuits Syst. Video Technol. (2023)","DOI":"10.1109\/TCSVT.2023.3267133"},{"key":"24_CR36","doi-asserted-by":"crossref","unstructured":"Su, B., Lu, S., Tan, C.L.: Binarization of historical document images using the local maximum and minimum. In: Proceedings of the 9th IAPR International Workshop on Document Analysis Systems, pp. 159\u2013166 (2010)","DOI":"10.1145\/1815330.1815351"},{"key":"24_CR37","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2019.06.020","volume":"96","author":"J Tang","year":"2019","unstructured":"Tang, J., Yang, Z., Wang, Y., Zheng, Q., Xu, Y., Bai, X.: Seglink++: detecting dense and arbitrary-shaped scene text by instance-aware component grouping. Pattern Recogn. 96, 106954 (2019)","journal-title":"Pattern Recogn."},{"issue":"3","key":"24_CR38","doi-asserted-by":"publisher","first-page":"1509","DOI":"10.1109\/TIP.2017.2656474","volume":"26","author":"Y Tang","year":"2017","unstructured":"Tang, Y., Wu, X.: Scene text detection and segmentation based on cascaded convolution neural networks. IEEE Trans. Image Process. 26(3), 1509\u20131520 (2017)","journal-title":"IEEE Trans. Image Process."},{"key":"24_CR39","doi-asserted-by":"publisher","first-page":"568","DOI":"10.1016\/j.patcog.2017.08.025","volume":"74","author":"QN Vo","year":"2018","unstructured":"Vo, Q.N., Kim, S.H., Yang, H.J., Lee, G.: Binarization of degraded document images based on hierarchical deep supervised network. Pattern Recogn. 74, 568\u2013586 (2018)","journal-title":"Pattern Recogn."},{"issue":"10","key":"24_CR40","doi-asserted-by":"publisher","first-page":"3349","DOI":"10.1109\/TPAMI.2020.2983686","volume":"43","author":"J Wang","year":"2020","unstructured":"Wang, J., Sun, K., Cheng, T., Jiang, B., Deng, C., Zhao, Y., Liu, D., Mu, Y., Tan, M., Wang, X., et al.: Deep high-resolution representation learning for visual recognition. IEEE Trans. Pattern Anal. Mach. Intell. 43(10), 3349\u20133364 (2020)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"24_CR41","doi-asserted-by":"crossref","unstructured":"Wang, X., Wu, C., Yu, H., Li, B., Xue, X.: Textformer: component-aware text segmentation with transformer. In: 2023 IEEE International Conference on Multimedia and Expo (ICME), pp. 1877\u20131882. IEEE (2023)","DOI":"10.1109\/ICME55011.2023.00322"},{"key":"24_CR42","doi-asserted-by":"crossref","unstructured":"Wu, Y., Natarajan, P., Rawls, S., AbdAlmageed, W.: Learning document image binarization from data. In: 2016 IEEE International Conference on Image Processing (ICIP), pp. 3763\u20133767. IEEE (2016)","DOI":"10.1109\/ICIP.2016.7533063"},{"key":"24_CR43","first-page":"12077","volume":"34","author":"E Xie","year":"2021","unstructured":"Xie, E., Wang, W., Yu, Z., Anandkumar, A., Alvarez, J.M., Luo, P.: Segformer: simple and efficient design for semantic segmentation with transformers. Adv. Neural. Inf. Process. Syst. 34, 12077\u201312090 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"24_CR44","doi-asserted-by":"crossref","unstructured":"Xu, X., Zhang, Z., Wang, Z., Price, B., Wang, Z., Shi, H.: Rethinking text segmentation: a novel dataset and a text-specific refinement approach. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12045\u201312055 (2021)","DOI":"10.1109\/CVPR46437.2021.01187"},{"key":"24_CR45","doi-asserted-by":"crossref","unstructured":"Xu, X., Qi, Z., Ma, J., Zhang, H., Shan, Y., Qie, X.: Bts: a bi-lingual benchmark for text segmentation in the wild. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 19152\u201319162 (2022)","DOI":"10.1109\/CVPR52688.2022.01856"},{"issue":"4","key":"24_CR46","doi-asserted-by":"publisher","first-page":"1093","DOI":"10.3390\/rs15041093","volume":"15","author":"X Yin","year":"2023","unstructured":"Yin, X., Li, X., Ni, P., Xu, Q., Kong, D.: A novel real-time edge-guided lidar semantic segmentation network for unstructured environments. Remote Sensing 15(4), 1093 (2023)","journal-title":"Remote Sensing"},{"key":"24_CR47","doi-asserted-by":"crossref","unstructured":"Yu, C., Wang, J., Gao, C., Yu, G., Shen, C., Sang, N.: Context prior for scene segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12416\u201312425 (2020)","DOI":"10.1109\/CVPR42600.2020.01243"},{"key":"24_CR48","doi-asserted-by":"crossref","unstructured":"Yu, H., Wang, X., Niu, K., Li, B., Xue, X.: Scene text segmentation with text-focused transformers. In: Proceedings of the 31st ACM International Conference on Multimedia, pp. 2898\u20132907 (2023)","DOI":"10.1145\/3581783.3611755"},{"key":"24_CR49","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"173","DOI":"10.1007\/978-3-030-58539-6_11","volume-title":"Computer Vision \u2013 ECCV 2020","author":"Y Yuan","year":"2020","unstructured":"Yuan, Y., Chen, X., Wang, J.: Object-contextual representations for semantic segmentation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12351, pp. 173\u2013190. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58539-6_11"},{"key":"24_CR50","doi-asserted-by":"crossref","unstructured":"Zdenek, J., Nakayama, H.: Erasing scene text with weak supervision. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 2238\u20132246 (2020)","DOI":"10.1109\/WACV45572.2020.9093544"},{"key":"24_CR51","doi-asserted-by":"crossref","unstructured":"Zhao, H., Shi, J., Qi, X., Wang, X., Jia, J.: Pyramid scene parsing network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2881\u20132890 (2017)","DOI":"10.1109\/CVPR.2017.660"},{"key":"24_CR52","doi-asserted-by":"crossref","unstructured":"Zheng, S., et\u00a0al.: Rethinking semantic segmentation from a sequence-to-sequence perspective with transformers. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6881\u20136890 (2021)","DOI":"10.1109\/CVPR46437.2021.00681"},{"key":"24_CR53","doi-asserted-by":"crossref","unstructured":"Zhou, X., Yao, C., Wen, H., Wang, Y., Zhou, S., He, W., Liang, J.: East: an efficient and accurate scene text detector. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5551\u20135560 (2017)","DOI":"10.1109\/CVPR.2017.283"},{"key":"24_CR54","doi-asserted-by":"crossref","unstructured":"Zhou, Y., Feild, J., Learned-Miller, E., Wang, R.: Scene text segmentation via inverse rendering. In: 2013 12th International Conference on Document Analysis and Recognition, pp. 457\u2013461. IEEE (2013)","DOI":"10.1109\/ICDAR.2013.98"},{"key":"24_CR55","doi-asserted-by":"crossref","unstructured":"Zu, X., Yu, H., Li, B., Xue, X.: Weakly-supervised text instance segmentation. In: Proceedings of the 31st ACM International Conference on Multimedia, pp. 1915\u20131923 (2023)","DOI":"10.1145\/3581783.3612243"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-72698-9_24","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,25]],"date-time":"2024-10-25T04:53:44Z","timestamp":1729832024000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-72698-9_24"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,26]]},"ISBN":["9783031726972","9783031726989"],"references-count":55,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-72698-9_24","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,10,26]]},"assertion":[{"value":"26 October 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}