{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,10]],"date-time":"2026-04-10T07:45:03Z","timestamp":1775807103250,"version":"3.50.1"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T00:00:00Z","timestamp":1750291200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T00:00:00Z","timestamp":1750291200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62172417"],"award-info":[{"award-number":["62172417"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62272461"],"award-info":[{"award-number":["62272461"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62276266"],"award-info":[{"award-number":["62276266"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Xuzhou Key Research and Development Program","award":["KC22287"],"award-info":[{"award-number":["KC22287"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["IJDAR"],"published-print":{"date-parts":[[2026,3]]},"DOI":"10.1007\/s10032-025-00539-5","type":"journal-article","created":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T00:09:34Z","timestamp":1750291774000},"page":"175-189","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Few-Shot Quaternion-valued Correlation Squeeze Network for Document Image Layout Segmentation"],"prefix":"10.1007","volume":"29","author":[{"given":"Rui","family":"Yao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qiwei","family":"Yu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Songhui","family":"Zhao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yuxuan","family":"Yang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yong","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bing","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,6,19]]},"reference":[{"key":"539_CR1","doi-asserted-by":"crossref","unstructured":"Antonacopoulos, A., Bridson, D., Papadopoulos, C., et\u00a0al.: A realistic dataset for performance evaluation of document layout analysis. In: 2009 10th International Conference on Document Analysis and Recognition, IEEE, pp 296\u2013300 (2009)","DOI":"10.1109\/ICDAR.2009.271"},{"key":"539_CR2","doi-asserted-by":"crossref","unstructured":"Arroyo, D.M., Postels, J., Tombari, F.: Variational transformer networks for layout generation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 13642\u201313652 (2021)","DOI":"10.1109\/CVPR46437.2021.01343"},{"issue":"12","key":"539_CR3","doi-asserted-by":"publisher","first-page":"2481","DOI":"10.1109\/TPAMI.2016.2644615","volume":"39","author":"V Badrinarayanan","year":"2017","unstructured":"Badrinarayanan, V., Kendall, A., Cipolla, R.: Segnet: A deep convolutional encoder-decoder architecture for image segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 39(12), 2481\u20132495 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"6","key":"539_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3355610","volume":"52","author":"GM Binmakhashen","year":"2019","unstructured":"Binmakhashen, G.M., Mahmoud, S.A.: Document layout analysis: a comprehensive survey. ACM Computing Surveys (CSUR) 52(6), 1\u201336 (2019)","journal-title":"ACM Computing Surveys (CSUR)"},{"issue":"4","key":"539_CR5","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1109\/TPAMI.2017.2699184","volume":"40","author":"LC Chen","year":"2017","unstructured":"Chen, L.C., Papandreou, G., Kokkinos, I., et al.: Deeplab: Semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected crfs. IEEE Trans. Pattern Anal. Mach. Intell. 40(4), 834\u2013848 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"539_CR6","unstructured":"Finn, C., Abbeel, P., Levine, S.: Model-agnostic meta-learning for fast adaptation of deep networks. In: International conference on machine learning, PMLR, pp 1126\u20131135 (2017)"},{"key":"539_CR7","doi-asserted-by":"crossref","unstructured":"Grassucci, E., Cicero, E., Comminiello, D.: Quaternion generative adversarial networks. In: Generative Adversarial Learning: Architectures and Applications. Springer, p 57\u201386 (2022)","DOI":"10.1007\/978-3-030-91390-8_4"},{"key":"539_CR8","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., et\u00a0al.: Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"539_CR9","unstructured":"Ioffe, S., Szegedy, C.: Batch normalization: Accelerating deep network training by reducing internal covariate shift. In: International conference on machine learning, pmlr, pp 448\u2013456 (2015)"},{"issue":"9","key":"539_CR10","doi-asserted-by":"publisher","first-page":"2478","DOI":"10.1109\/TMM.2018.2798282","volume":"20","author":"B Kang","year":"2018","unstructured":"Kang, B., Lee, Y., Nguyen, T.Q.: Depth-adaptive deep neural network for semantic segmentation. IEEE Trans. Multimedia 20(9), 2478\u20132490 (2018)","journal-title":"IEEE Trans. Multimedia"},{"key":"539_CR11","unstructured":"Kingma, D.P., Ba, J.: Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"},{"key":"539_CR12","doi-asserted-by":"crossref","unstructured":"Lang, C., Cheng, G., Tu, B., et\u00a0al.: Learning what not to segment: A new perspective on few-shot segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 8057\u20138067 (2022)","DOI":"10.1109\/CVPR52688.2022.00789"},{"key":"539_CR13","doi-asserted-by":"crossref","unstructured":"Lei, S., Zhang, X., He, J., et\u00a0al.: Cross-domain few-shot semantic segmentation. In: European Conference on Computer Vision, Springer, pp 73\u201390 (2022)","DOI":"10.1007\/978-3-031-20056-4_5"},{"key":"539_CR14","doi-asserted-by":"crossref","unstructured":"Li, Y., Zou, Y., Ma, J.: Deeplayout: A semantic segmentation approach to page layout analysis. In: Intelligent Computing Methodologies: 14th International Conference, ICIC 2018, Wuhan, China, August 15-18, 2018, Proceedings, Part III 14, Springer, pp 266\u2013277 (2018)","DOI":"10.1007\/978-3-319-95957-3_30"},{"key":"539_CR15","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2021.107882","volume":"115","author":"Y Li","year":"2021","unstructured":"Li, Y., Zhang, P., Xu, X., et al.: Few-shot prototype alignment regularization network for document image layout segmentation. Pattern Recogn. 115, 107882 (2021)","journal-title":"Pattern Recogn."},{"key":"539_CR16","doi-asserted-by":"crossref","unstructured":"Liu, B., Ding, Y., Jiao, J., et\u00a0al.: Anti-aliasing semantic reconstruction for few-shot semantic segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 9747\u20139756 (2021)","DOI":"10.1109\/CVPR46437.2021.00962"},{"key":"539_CR17","doi-asserted-by":"publisher","first-page":"8580","DOI":"10.1109\/TMM.2023.3238521","volume":"25","author":"H Liu","year":"2023","unstructured":"Liu, H., Peng, P., Chen, T., et al.: Fecanet: Boosting few-shot semantic segmentation with feature-enhanced context-aware network. IEEE Trans. Multimedia 25, 8580\u20138592 (2023)","journal-title":"IEEE Trans. Multimedia"},{"key":"539_CR18","doi-asserted-by":"crossref","unstructured":"Liu, Y., Zhang, X., Zhang, S., et\u00a0al.: Part-aware prototype network for few-shot semantic segmentation. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part IX 16, Springer, pp 142\u2013158 (2020)","DOI":"10.1007\/978-3-030-58545-7_9"},{"key":"539_CR19","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., Darrell, T.: Fully convolutional networks for semantic segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3431\u20133440 (2015)","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"539_CR20","doi-asserted-by":"crossref","unstructured":"Mehri, M., Nayef, N., H\u00e9roux, P., et\u00a0al.: Learning texture features for enhancement and segmentation of historical document images. In: Proceedings of the 3rd International Workshop on Historical Document Imaging and Processing, pp 47\u201354 (2015)","DOI":"10.1145\/2809544.2809545"},{"key":"539_CR21","doi-asserted-by":"crossref","unstructured":"Min, J., Kang, D., Cho, M.: Hypercorrelation squeeze for few-shot segmentation. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 6941\u20136952 (2021)","DOI":"10.1109\/ICCV48922.2021.00686"},{"key":"539_CR22","doi-asserted-by":"crossref","unstructured":"Noh, H., Hong, S., Han, B.: Learning deconvolution network for semantic segmentation. In: Proceedings of the IEEE international conference on computer vision, pp 1520\u20131528 (2015)","DOI":"10.1109\/ICCV.2015.178"},{"issue":"11","key":"539_CR23","doi-asserted-by":"publisher","first-page":"1162","DOI":"10.1109\/34.244677","volume":"15","author":"L O\u2019Gorman","year":"1993","unstructured":"O\u2019Gorman, L.: The document spectrum for page layout analysis. IEEE Trans. Pattern Anal. Mach. Intell. 15(11), 1162\u20131173 (1993)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"539_CR24","doi-asserted-by":"publisher","first-page":"260","DOI":"10.1016\/j.patcog.2015.10.021","volume":"52","author":"D Rav\u00ec","year":"2016","unstructured":"Rav\u00ec, D., Bober, M., Farinella, G.M., et al.: Semantic segmentation of images exploiting dct based features and random forest. Pattern Recogn. 52, 260\u2013273 (2016)","journal-title":"Pattern Recogn."},{"key":"539_CR25","doi-asserted-by":"crossref","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-net: Convolutional networks for biomedical image segmentation. In: Medical image computing and computer-assisted intervention\u2013MICCAI 2015: 18th international conference, Munich, Germany, October 5-9, 2015, proceedings, part III 18, Springer, pp 234\u2013241 (2015)","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"539_CR26","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky, O., Deng, J., Su, H., et al.: Imagenet large scale visual recognition challenge. Int. J. Comput. Vision 115, 211\u2013252 (2015)","journal-title":"Int. J. Comput. Vision"},{"key":"539_CR27","doi-asserted-by":"crossref","unstructured":"Shaban, A., Bansal, S., Liu, Z., et\u00a0al.: One-shot learning for semantic segmentation. arXiv preprint arXiv:1709.03410 (2017)","DOI":"10.5244\/C.31.167"},{"key":"539_CR28","unstructured":"Snell, J., Swersky, K., Zemel, R.: Prototypical networks for few-shot learning. Advances in neural information processing systems 30 (2017)"},{"key":"539_CR29","doi-asserted-by":"crossref","unstructured":"Sun, K., Xiao, B., Liu, D., et\u00a0al.: Deep high-resolution representation learning for human pose estimation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 5693\u20135703 (2019)","DOI":"10.1109\/CVPR.2019.00584"},{"key":"539_CR30","doi-asserted-by":"crossref","unstructured":"Sung, F., Yang, Y., Zhang, L., et\u00a0al.: Learning to compare: Relation network for few-shot learning. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1199\u20131208 (2018)","DOI":"10.1109\/CVPR.2018.00131"},{"issue":"2","key":"539_CR31","doi-asserted-by":"publisher","first-page":"214","DOI":"10.1016\/j.sigpro.2010.06.024","volume":"91","author":"CC Took","year":"2011","unstructured":"Took, C.C., Mandic, D.P.: Augmented second-order statistics of quaternion random signals. Signal Process. 91(2), 214\u2013224 (2011)","journal-title":"Signal Process."},{"key":"539_CR32","unstructured":"Vinyals, O., Blundell, C., Lillicrap, T., et\u00a0al.: Matching networks for one shot learning. Advances in neural information processing systems 29 (2016)"},{"key":"539_CR33","doi-asserted-by":"crossref","unstructured":"Wang, H., Zhang, X., Hu, Y., et\u00a0al.: Few-shot semantic segmentation with democratic attention networks. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XIII 16, Springer, pp 730\u2013746 (2020)","DOI":"10.1007\/978-3-030-58601-0_43"},{"key":"539_CR34","doi-asserted-by":"crossref","unstructured":"Wang, K., Liew, J.H., Zou, Y., et\u00a0al.: Panet: Few-shot image semantic segmentation with prototype alignment. In: proceedings of the IEEE\/CVF international conference on computer vision, pp 9197\u20139206 (2019)","DOI":"10.1109\/ICCV.2019.00929"},{"key":"539_CR35","doi-asserted-by":"crossref","unstructured":"Wick, C., Puppe, F.: Fully convolutional neural networks for page segmentation of historical document images. In: 2018 13th IAPR International Workshop on Document Analysis Systems (DAS), IEEE, pp 287\u2013292 (2018)","DOI":"10.1109\/DAS.2018.39"},{"key":"539_CR36","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J.Y., et\u00a0al.: Cbam: Convolutional block attention module. In: Proceedings of the European conference on computer vision (ECCV), pp 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"539_CR37","doi-asserted-by":"publisher","first-page":"3427","DOI":"10.1109\/TMM.2020.3025696","volume":"23","author":"X Wu","year":"2020","unstructured":"Wu, X., Chen, Q., Xiao, Y., et al.: Lcsegnet: An efficient semantic segmentation network for large-scale complex chinese character recognition. IEEE Trans. Multimedia 23, 3427\u20133440 (2020)","journal-title":"IEEE Trans. Multimedia"},{"issue":"3","key":"539_CR38","doi-asserted-by":"publisher","DOI":"10.1016\/j.ipm.2023.103339","volume":"60","author":"X Wu","year":"2023","unstructured":"Wu, X., Ma, T., Du, X., et al.: Drfn: A unified framework for complex document layout analysis. Information Processing & Management 60(3), 103339 (2023)","journal-title":"Information Processing & Management"},{"key":"539_CR39","doi-asserted-by":"crossref","unstructured":"Wu, Y., He, K.: Group normalization. In: Proceedings of the European conference on computer vision (ECCV), pp 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01261-8_1"},{"key":"539_CR40","doi-asserted-by":"crossref","unstructured":"Xu, Y., Li, M., Cui, L., et\u00a0al.: Layoutlm: Pre-training of text and layout for document image understanding. In: Proceedings of the 26th ACM SIGKDD international conference on knowledge discovery & data mining, pp 1192\u20131200 (2020)","DOI":"10.1145\/3394486.3403172"},{"issue":"3","key":"539_CR41","doi-asserted-by":"publisher","first-page":"676","DOI":"10.1109\/TMM.2019.2932566","volume":"22","author":"B Yan","year":"2019","unstructured":"Yan, B., Niu, X., Bare, B., et al.: Semantic segmentation guided pixel fusion for image retargeting. IEEE Trans. Multimedia 22(3), 676\u2013687 (2019)","journal-title":"IEEE Trans. Multimedia"},{"issue":"12","key":"539_CR42","doi-asserted-by":"publisher","first-page":"3389","DOI":"10.1109\/TMM.2018.2838320","volume":"20","author":"C Yan","year":"2018","unstructured":"Yan, C., Xie, H., Chen, J., et al.: A fast uyghur text detector for complex background images. IEEE Trans. Multimedia 20(12), 3389\u20133398 (2018)","journal-title":"IEEE Trans. Multimedia"},{"key":"539_CR43","doi-asserted-by":"crossref","unstructured":"Yang, B., Liu, C., Li, B., et\u00a0al.: Prototype mixture models for few-shot semantic segmentation. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part VIII 16, Springer, pp 763\u2013778 (2020)","DOI":"10.1007\/978-3-030-58598-3_45"},{"key":"539_CR44","unstructured":"Yang, L., Zhang, R.Y., Li, L., et\u00a0al.: Simam: A simple, parameter-free attention module for convolutional neural networks. In: International conference on machine learning, PMLR, pp 11863\u201311874 (2021)"},{"key":"539_CR45","doi-asserted-by":"crossref","unstructured":"Yang, X., Yumer, E., Asente, P., et\u00a0al.: Learning to extract semantic structure from documents using multimodal fully convolutional neural networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 5315\u20135324 (2017)","DOI":"10.1109\/CVPR.2017.462"},{"key":"539_CR46","doi-asserted-by":"crossref","unstructured":"Zhang, C., Lin, G., Liu, F., et\u00a0al.: Pyramid graph networks with connection attentions for region-based one-shot semantic segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 9587\u20139595 (2019)","DOI":"10.1109\/ICCV.2019.00968"},{"key":"539_CR47","doi-asserted-by":"crossref","unstructured":"Zhang, C., Lin, G., Liu, F., et\u00a0al.: Canet: Class-agnostic segmentation networks with iterative refinement and attentive few-shot learning. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 5217\u20135226 (2019)","DOI":"10.1109\/CVPR.2019.00536"},{"issue":"9","key":"539_CR48","doi-asserted-by":"publisher","first-page":"3855","DOI":"10.1109\/TCYB.2020.2992433","volume":"50","author":"X Zhang","year":"2020","unstructured":"Zhang, X., Wei, Y., Yang, Y., et al.: Sg-one: Similarity guidance network for one-shot semantic segmentation. IEEE transactions on cybernetics 50(9), 3855\u20133865 (2020)","journal-title":"IEEE transactions on cybernetics"},{"key":"539_CR49","doi-asserted-by":"crossref","unstructured":"Zhao, H., Shi, J., Qi, X., et\u00a0al.: Pyramid scene parsing network. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 2881\u20132890 (2017)","DOI":"10.1109\/CVPR.2017.660"},{"issue":"5","key":"539_CR50","doi-asserted-by":"publisher","first-page":"2102","DOI":"10.1109\/TCSVT.2022.3223150","volume":"33","author":"Z Zheng","year":"2022","unstructured":"Zheng, Z., Huang, G., Yuan, X., et al.: Quaternion-valued correlation learning for few-shot semantic segmentation. IEEE Trans. Circuits Syst. Video Technol. 33(5), 2102\u20132115 (2022)","journal-title":"IEEE Trans. Circuits Syst. Video Technol."}],"container-title":["International Journal on Document Analysis and Recognition (IJDAR)"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10032-025-00539-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10032-025-00539-5","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10032-025-00539-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,10]],"date-time":"2026-04-10T06:49:44Z","timestamp":1775803784000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10032-025-00539-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,19]]},"references-count":50,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,3]]}},"alternative-id":["539"],"URL":"https:\/\/doi.org\/10.1007\/s10032-025-00539-5","relation":{},"ISSN":["1433-2833","1433-2825"],"issn-type":[{"value":"1433-2833","type":"print"},{"value":"1433-2825","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,6,19]]},"assertion":[{"value":"4 September 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 March 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 June 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 June 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest\/Competing interests"}}]}}