{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,9]],"date-time":"2026-06-09T07:04:52Z","timestamp":1780988692014,"version":"3.54.1"},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,12,7]],"date-time":"2025-12-07T00:00:00Z","timestamp":1765065600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,12,7]],"date-time":"2025-12-07T00:00:00Z","timestamp":1765065600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"name":"Guangdong Provincial Natural Science Foundation General Project","award":["2024A1515011971"],"award-info":[{"award-number":["2024A1515011971"]}]},{"name":"Special Project for Key Fields in Higher Education of Guangdong, China","award":["2022ZDZX1013\uff0c2023ZDZX1008"],"award-info":[{"award-number":["2022ZDZX1013\uff0c2023ZDZX1008"]}]},{"name":"Guangdong Provincial Key Laboratory of Intellectual Property and Big Data","award":["2018B030322016"],"award-info":[{"award-number":["2018B030322016"]}]},{"name":"Key Discipline Research Capacity Improvement Project of Guangdong Province","award":["2022ZDJS013"],"award-info":[{"award-number":["2022ZDJS013"]}]},{"name":"Key Discipline Research Capacity Improvement Project of Guangdong Province","award":["2024ZDJS022"],"award-info":[{"award-number":["2024ZDJS022"]}]},{"name":"Guangdong Provincial Science and Technology Project","award":["KTP20210197"],"award-info":[{"award-number":["KTP20210197"]}]},{"DOI":"10.13039\/100019024","name":"Guangdong Polytechnic Normal University","doi-asserted-by":"publisher","award":["22GPNUZDJS16"],"award-info":[{"award-number":["22GPNUZDJS16"]}],"id":[{"id":"10.13039\/100019024","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2026,1]]},"DOI":"10.1007\/s00371-025-04256-2","type":"journal-article","created":{"date-parts":[[2025,12,7]],"date-time":"2025-12-07T15:38:18Z","timestamp":1765121898000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Local feature enhancement for robust 2D multi-person pose estimation via pose refinement network"],"prefix":"10.1007","volume":"42","author":[{"given":"Weili","family":"Tian","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jin","family":"Zhan","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Zhaokang","family":"Guan","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Chensheng","family":"Yi","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Fangyuan","family":"Lei","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xiaoyong","family":"Liu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Huihui","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yufeng","family":"Zeng","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,12,7]]},"reference":[{"key":"4256_CR1","doi-asserted-by":"crossref","unstructured":"Sun, K., Xiao, B., Liu, D.: Deep high-resolution representation learning for human pose estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 5693\u20135703 (2019)","DOI":"10.1109\/CVPR.2019.00584"},{"key":"4256_CR2","doi-asserted-by":"crossref","unstructured":"Bras\u00f3, G., Kister, N., Leal-Taix\u00e9, L.: The center of attention: Center-keypoints grouping via attention for multi-person pose estimation. In: Proceedings of the IEEE International Conference on Computer Vision (ICCV), pp. 11853\u201311863 (2021)","DOI":"10.1109\/ICCV48922.2021.01164"},{"key":"4256_CR3","unstructured":"Li, W., Wang, Z., Yin, B.: Rethinking on multi-stage networks for human pose estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 1901.00148 (2019)"},{"key":"4256_CR4","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Doll\u00e1r, P.: Mask r-cnn. In: Proceedings of the IEEE International Conference on Computer Vision (ICCV), pp. 2961\u20132969 (2017)","DOI":"10.1109\/ICCV.2017.322"},{"key":"4256_CR5","doi-asserted-by":"crossref","unstructured":"Chen, Y., Wang, Z., Peng, Y.: Cascaded pyramid network for multi-person pose estimation. In: Proceedings of the IEEE Conference On Computer Vision and Pattern Recognition (CVPR), pp. 7103\u20137112 (2018)","DOI":"10.1109\/CVPR.2018.00742"},{"key":"4256_CR6","doi-asserted-by":"crossref","unstructured":"Ning, G., Pei, J., Huang, H.: Lighttrack: A generic framework for online top-down human pose tracking. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CCPR), pp. 1034\u20131035 (2020)","DOI":"10.1109\/CVPRW50498.2020.00525"},{"key":"4256_CR7","unstructured":"Tian, Z., Chen, H., Shen, C.: Directpose: Direct end-to-end multi-person pose estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 1911.07451 (2019)"},{"key":"4256_CR8","doi-asserted-by":"crossref","unstructured":"Zhang, F., Zhu, X., Ye, M.: Fast human pose estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 3517\u20133526 (2019)","DOI":"10.1109\/CVPR.2019.00363"},{"key":"4256_CR9","unstructured":"Newell, A., Huang, Z., Deng, J.: Associative embedding: End-to-end learning for joint detection and grouping. Adv. Neural Inf. Process. Syst., 30 (2017)"},{"key":"4256_CR10","doi-asserted-by":"crossref","unstructured":"Kocabas, M., Karagoz, S., Akbas, E.: Multiposenet: Fast multi-person pose estimation using pose residual network. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 417\u2013433 (2018)","DOI":"10.1007\/978-3-030-01252-6_26"},{"key":"4256_CR11","doi-asserted-by":"crossref","unstructured":"Papandreou, G., Zhu, T., Chen, L.: Personlab: Person pose estimation and instance segmentation with a bottom-up, part-based, geometric embedding model. In: Proceedings of the European Conference on Computer Vision (ECCV). pp. 269\u2013286 (2018)","DOI":"10.1007\/978-3-030-01264-9_17"},{"key":"4256_CR12","doi-asserted-by":"crossref","unstructured":"Artacho, B., Savakis, A.: BAPose: Bottom-Up Pose Estimation with Disentangled Waterfall Representations. In: Proceedings of the IEEE Winter Conference on Applications of Computer Vision (CACV), pp. 528\u2013537 (2023)","DOI":"10.1109\/WACVW58289.2023.00059"},{"key":"4256_CR13","doi-asserted-by":"crossref","unstructured":"Cheng, Y., Wang, B., Yang B.: Monocular 3D multi-person pose estimation by integrating top-down and bottom-up networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 7649\u20137659 (2021)","DOI":"10.1109\/CVPR46437.2021.00756"},{"key":"4256_CR14","first-page":"6278","volume":"34","author":"D Wang","year":"2021","unstructured":"Wang, D., Zhang, S., Hua, G.: Robust pose estimation in crowded scenes with direct pose-level inference. Adv. Neural. Inf. Process. Syst. 34, 6278\u20136289 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"4256_CR15","doi-asserted-by":"crossref","unstructured":"Geng, Z., Sun, K., xiao, B.: Bottom-up human pose estimation via disentangled keypoint regression. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 14676\u201314686 (2021)","DOI":"10.1109\/CVPR46437.2021.01444"},{"key":"4256_CR16","doi-asserted-by":"crossref","unstructured":"Cao, Z., Simon, T., Wei, S.: Realtime multi-person 2d pose estimation using part affinity fields. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 7291\u20137299 (2017)","DOI":"10.1109\/CVPR.2017.143"},{"key":"4256_CR17","doi-asserted-by":"crossref","unstructured":"McNally, W., Vats, K., Wong, A.: Rethinking keypoints representations: Modeling keypoints and poses as objects for multi-person human pose estimation. In: Proceedings of European Conference on Computer Vision (ECCV), pp. 37\u201354 (2022)","DOI":"10.1007\/978-3-031-20068-7_3"},{"key":"4256_CR18","doi-asserted-by":"crossref","unstructured":"Xiao, Y., Wang, X., Yu, D.: Adaptivepose: Human parts as adaptive points. In: Proceedings of the AAAI Conference on Artificial Intelligence (AAAI), pp. 2813\u20132821 (2022)","DOI":"10.1609\/aaai.v36i3.20185"},{"key":"4256_CR19","doi-asserted-by":"crossref","unstructured":"Yao, J., Chen, J., Niu, L., Sheng, B.: Scene-aware human pose generation using transformer. In: Proceedings of the 31st ACM International Conference on Multimedia, pp. 2847\u20132855 (2023)","DOI":"10.1145\/3581783.3612439"},{"key":"4256_CR20","doi-asserted-by":"publisher","DOI":"10.1007\/s00371-021-02229-9","author":"S Zeghoud","year":"2022","unstructured":"Zeghoud, S., Ali, S.G., Ertugrul, E., Kamel, A., Sheng, B.: Real-time spatial normalization for dynamic gesture classification. Vis. Comput. (2022). https:\/\/doi.org\/10.1007\/s00371-021-02229-9","journal-title":"Vis. Comput."},{"key":"4256_CR21","doi-asserted-by":"crossref","unstructured":"Yu Q, Hao C, Yuan X, et al. Generalizable Articulated Object Perception with Superpoints. In: ICASSP 2025\u20132025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp.1\u20135 (2025)","DOI":"10.1109\/ICASSP49660.2025.10890874"},{"key":"4256_CR22","doi-asserted-by":"crossref","unstructured":"Yu X, Jiang H, Zhang L, et al. Towards Robust Category-level Articulation Pose Estimation via Integrated Differentiable Rendering. In: ICASSP 2025\u20132025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp.1\u20135 (2025)","DOI":"10.1109\/ICASSP49660.2025.10889272"},{"key":"4256_CR23","doi-asserted-by":"publisher","DOI":"10.1080\/10447318.2018.1543081","author":"A Kamel","year":"2019","unstructured":"Kamel, A., Liu, B., Li, P., Sheng, B.: An investigation of 3D human pose estimation for learning Tai Chi: a human factor perspective. Int. J. Hum.-Comput. Interact. (2019). https:\/\/doi.org\/10.1080\/10447318.2018.1543081","journal-title":"Int. J. Hum.-Comput. Interact."},{"key":"4256_CR24","doi-asserted-by":"publisher","DOI":"10.1016\/j.vrih.2023.07.002","author":"M Jiang","year":"2024","unstructured":"Jiang, M., Tian, Z., Yu, C., Shi, Y., Liu, L.: Intelligent 3D garment system of the human body based on deep spiking neural network. Virtual Reality Intell. Hardware (2024). https:\/\/doi.org\/10.1016\/j.vrih.2023.07.002","journal-title":"Virtual Reality Intell. Hardware"},{"key":"4256_CR25","doi-asserted-by":"crossref","unstructured":"Artacho, B., Savakis, A.: Unipose: Unified human pose estimation in single images and videos. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 7035\u20137044 (2020)","DOI":"10.1109\/CVPR42600.2020.00706"},{"key":"4256_CR26","doi-asserted-by":"crossref","unstructured":"Cheng, B., Xiao, B., Wang, J.: Higherhrnet: Scale-aware representation learning for bottom-up human pose estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 5386\u20135395 (2020)","DOI":"10.1109\/CVPR42600.2020.00543"},{"key":"4256_CR27","doi-asserted-by":"crossref","unstructured":"Luo, Z., Wang, Z., Huang, Y.: Rethinking the heatmap regression for bottom-up human pose estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 13264\u201313273 (2021)","DOI":"10.1109\/CVPR46437.2021.01306"},{"key":"4256_CR28","doi-asserted-by":"crossref","unstructured":"Zoph, B., Cubuk, D., Ghiasi, G.: Learning data augmentation strategies for object detection. In: Proceedings of European Conference on Computer Vision (ECCV), pp. 566\u2013583 (2020)","DOI":"10.1007\/978-3-030-58583-9_34"},{"issue":"6","key":"4256_CR29","first-page":"1049","volume":"13","author":"J Cheng","year":"2019","unstructured":"Cheng, J., Wang, Q., Yang, W.: Ssd object detection algorithm with multi-scale convolution feature fusion. J. Front. Comput. Sci. Technol. 13(6), 1049\u20131061 (2019)","journal-title":"J. Front. Comput. Sci. Technol."},{"key":"4256_CR30","doi-asserted-by":"crossref","unstructured":"Liu, Y., Yang, F., Hu, P.: Small-object detection in UAV-captured images via multi-branch parallel feature pyramid networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp. 145740\u2013145750 (2020)","DOI":"10.1109\/ACCESS.2020.3014910"},{"issue":"1","key":"4256_CR31","first-page":"149","volume":"38","author":"P Wang","year":"2021","unstructured":"Wang, P., Lu, Y., Zhan, T.: Small object detection algorithm based on PDSSD improved neural network. Comput. Appl. Softw. 38(1), 149\u2013156 (2021)","journal-title":"Comput. Appl. Softw."},{"issue":"4","key":"4256_CR32","first-page":"241","volume":"47","author":"Q Xi","year":"2021","unstructured":"Xi, Q., Zhang, D., Peng, L.: Small object detection algorithm based on improved dense network and quadratic regression. Comput. Eng. 47(4), 241\u2013247 (2021)","journal-title":"Comput. Eng."},{"key":"4256_CR33","doi-asserted-by":"crossref","unstructured":"Yan, S., Liu, Y., Wang, H., Du, X., Liu, M., Liu, H.: Cross-modal retrieval for motion and text via droptriple loss, ACM International Conference on Multimedia in Asia, pp. 1\u20137 (2023).","DOI":"10.1145\/3595916.3626459"},{"issue":"11","key":"4256_CR34","doi-asserted-by":"publisher","first-page":"11525","DOI":"10.1109\/TCSVT.2024.3421565","volume":"34","author":"S Yan","year":"2024","unstructured":"Yan, S., Liu, M., Wang, Y., Liu, Y., Liu, H.: MLP: motion label prior for temporal sentence localization in untrimmed 3D human motions. IEEE Trans. Circuits Syst. Video Technol. 34(11), 11525\u201311550 (2024)","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"key":"4256_CR35","unstructured":"Yan, S., Wang, Y., Du, X., Jin, H., Liu, M.: Improving Fine-grained Understanding for Retrieval in Human Motion and Text, IEEE Signal Processing Letters, pp. 1\u20135 (2024)."},{"key":"4256_CR36","doi-asserted-by":"crossref","unstructured":"Hou, Q., Zhou, D., Feng, J.: Coordinate attention for efficient mobile network design. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 13713\u201313722 (2021)","DOI":"10.1109\/CVPR46437.2021.01350"},{"key":"4256_CR37","unstructured":"Sun, K., Geng, Z., Meng, D.: Bottom-up human pose estimation by ranking heatmap-guided adaptive keypoints estimates. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 2006.15480 (2020)"},{"key":"4256_CR38","doi-asserted-by":"crossref","unstructured":"Jin, S., Liu, W.: Differentiable Hierarchical Graph Grouping for Multi-person Pose Estimation. In: Proceedings of European Conference on Computer Vision (ECCV), pp. 718\u2013734 (2020)","DOI":"10.1007\/978-3-030-58571-6_42"},{"key":"4256_CR39","doi-asserted-by":"crossref","unstructured":"Li, Y., Yang, S., Liu, P.: Simcc: A simple coordinate classification perspective for human pose estimation. In:Proceedings of European Conference on Computer Vision (ECCV), pp. 89\u2013106 (2022)","DOI":"10.1007\/978-3-031-20068-7_6"},{"key":"4256_CR40","doi-asserted-by":"crossref","unstructured":"Li, J., Wang, C., Zhu, H.: Crowdpose: Efficient crowded scenes pose estimation and a new benchmark. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 10863\u201310872 (2019)","DOI":"10.1109\/CVPR.2019.01112"},{"key":"4256_CR41","doi-asserted-by":"crossref","unstructured":"Wei, F., Sun, X., Li, H.: Point-set anchors for object detection, instance segmentation and pose estimation. In: Proceedings of European Conference on Computer Vision (ECCV), pp. 527\u2013544 (2020)","DOI":"10.1007\/978-3-030-58607-2_31"},{"key":"4256_CR42","unstructured":"Zhou, X., Wang, D., Kr\u00e4henb\u00fchl, P.: Objects as points. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 1904.07850 (2019)"},{"key":"4256_CR43","doi-asserted-by":"crossref","unstructured":"Tian, C., Yu, R., Zhao, X.: Posedet: fast multi-person pose estimation using pose embedding. In: Proceedings of 2021 16th IEEE International Conference on Automatic Face and Gesture Recognition, pp. 1\u20138 (2021)","DOI":"10.1109\/FG52635.2021.9667045"},{"key":"4256_CR44","doi-asserted-by":"crossref","unstructured":"Lin, T., Maire, M., Belongie, S.: Microsoft COCO: Common objects in context. In: Proceedings of Computer Vision\u2013ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6\u201312, 2014, Proceedings, Part V 13. Springer International Publishing, pp. 740\u2013755 (2014)","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"4256_CR45","doi-asserted-by":"crossref","unstructured":"Hu, J., Shen, L., Sun, G.: Squeeze-and-excitation networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 7132\u20137141 (2018)","DOI":"10.1109\/CVPR.2018.00745"},{"key":"4256_CR46","doi-asserted-by":"crossref","unstructured":"Kirillov, A., Mintun, E., Ravi, N.: Segment anything. In: Proceedings of the IEEE International Conference on Computer Vision (ICCV), pp. 4015\u20134026 (2023)","DOI":"10.1109\/ICCV51070.2023.00371"},{"key":"4256_CR47","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, Y.: Cbam: Convolutional block attention module. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01234-2_1"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-025-04256-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-025-04256-2","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-025-04256-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,4]],"date-time":"2026-03-04T13:02:13Z","timestamp":1772629333000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-025-04256-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,7]]},"references-count":47,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,1]]}},"alternative-id":["4256"],"URL":"https:\/\/doi.org\/10.1007\/s00371-025-04256-2","relation":{"has-preprint":[{"id-type":"doi","id":"10.21203\/rs.3.rs-5034986\/v1","asserted-by":"object"}]},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,12,7]]},"assertion":[{"value":"5 September 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 October 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 December 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"24"}}